{"id":"https://openalex.org/W3214718962","doi":"https://doi.org/10.1109/lca.2021.3126450","title":"Near-Data Processing in Memory Expander for DNN Acceleration on GPUs","display_name":"Near-Data Processing in Memory Expander for DNN Acceleration on GPUs","publication_year":2021,"publication_date":"2021-07-01","ids":{"openalex":"https://openalex.org/W3214718962","doi":"https://doi.org/10.1109/lca.2021.3126450","mag":"3214718962"},"language":"en","primary_location":{"id":"doi:10.1109/lca.2021.3126450","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lca.2021.3126450","pdf_url":null,"source":{"id":"https://openalex.org/S17643076","display_name":"IEEE Computer Architecture Letters","issn_l":"1556-6056","issn":["1556-6056","1556-6064","2473-2575"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computer Architecture Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074288663","display_name":"Hyungkyu Ham","orcid":"https://orcid.org/0000-0002-4989-2834"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Hyungkyu Ham","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057504898","display_name":"Hyunuk Cho","orcid":"https://orcid.org/0000-0002-1554-1884"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyunuk Cho","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100340264","display_name":"Minjae Kim","orcid":"https://orcid.org/0000-0002-6369-245X"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Minjae Kim","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023909110","display_name":"Jueon Park","orcid":"https://orcid.org/0000-0003-4824-0698"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jueon Park","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062791122","display_name":"Jeongmin Hong","orcid":"https://orcid.org/0000-0002-5492-5346"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jeongmin Hong","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005051912","display_name":"Hyojin Sung","orcid":"https://orcid.org/0000-0002-3036-6180"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyojin Sung","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064884832","display_name":"Eunhyeok Park","orcid":"https://orcid.org/0000-0002-7331-9819"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Eunhyeok Park","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039338759","display_name":"Euicheol Lim","orcid":"https://orcid.org/0000-0002-8910-533X"},"institutions":[{"id":"https://openalex.org/I134353371","display_name":"SK Group (South Korea)","ror":"https://ror.org/03696td91","country_code":"KR","type":"company","lineage":["https://openalex.org/I134353371"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Euicheol Lim","raw_affiliation_strings":["SK Hynix, Icheon, Gyeonggi, South Korea"],"affiliations":[{"raw_affiliation_string":"SK Hynix, Icheon, Gyeonggi, South Korea","institution_ids":["https://openalex.org/I134353371"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100334897","display_name":"Gwangsun Kim","orcid":"https://orcid.org/0000-0001-5749-5794"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Gwangsun Kim","raw_affiliation_strings":["Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5074288663"],"corresponding_institution_ids":["https://openalex.org/I123900574"],"apc_list":null,"apc_paid":null,"fwci":0.4048,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.61762306,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"20","issue":"2","first_page":"171","last_page":"174"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8963940143585205},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6454553604125977},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5581296682357788},{"id":"https://openalex.org/keywords/memory-controller","display_name":"Memory controller","score":0.5394696593284607},{"id":"https://openalex.org/keywords/memory-architecture","display_name":"Memory architecture","score":0.5315834283828735},{"id":"https://openalex.org/keywords/in-memory-processing","display_name":"In-Memory Processing","score":0.47658655047416687},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.47300177812576294},{"id":"https://openalex.org/keywords/interleaved-memory","display_name":"Interleaved memory","score":0.4264909327030182},{"id":"https://openalex.org/keywords/cas-latency","display_name":"CAS latency","score":0.422294557094574},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.40086984634399414},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.3644048571586609},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.30156612396240234},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2826935052871704},{"id":"https://openalex.org/keywords/semiconductor-memory","display_name":"Semiconductor memory","score":0.18945109844207764}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8963940143585205},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6454553604125977},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5581296682357788},{"id":"https://openalex.org/C100800780","wikidata":"https://www.wikidata.org/wiki/Q1175867","display_name":"Memory controller","level":3,"score":0.5394696593284607},{"id":"https://openalex.org/C2779602883","wikidata":"https://www.wikidata.org/wiki/Q15544750","display_name":"Memory architecture","level":2,"score":0.5315834283828735},{"id":"https://openalex.org/C123593499","wikidata":"https://www.wikidata.org/wiki/Q6008583","display_name":"In-Memory Processing","level":5,"score":0.47658655047416687},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.47300177812576294},{"id":"https://openalex.org/C63511323","wikidata":"https://www.wikidata.org/wiki/Q908936","display_name":"Interleaved memory","level":4,"score":0.4264909327030182},{"id":"https://openalex.org/C189930140","wikidata":"https://www.wikidata.org/wiki/Q1112878","display_name":"CAS latency","level":4,"score":0.422294557094574},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.40086984634399414},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.3644048571586609},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.30156612396240234},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2826935052871704},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.18945109844207764},{"id":"https://openalex.org/C194222762","wikidata":"https://www.wikidata.org/wiki/Q114486","display_name":"Query by Example","level":4,"score":0.0},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.0},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.0},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lca.2021.3126450","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lca.2021.3126450","pdf_url":null,"source":{"id":"https://openalex.org/S17643076","display_name":"IEEE Computer Architecture Letters","issn_l":"1556-6056","issn":["1556-6056","1556-6064","2473-2575"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computer Architecture Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8318857934","display_name":null,"funder_award_id":"NRF-2019R1C1C1009790","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320317879","display_name":"SK Hynix","ror":null},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1836465849","https://openalex.org/W1985818188","https://openalex.org/W2034861439","https://openalex.org/W2194775991","https://openalex.org/W2464177207","https://openalex.org/W2903754802","https://openalex.org/W2963163009","https://openalex.org/W2979719709","https://openalex.org/W3042495273","https://openalex.org/W3043023836","https://openalex.org/W3043443960","https://openalex.org/W3100710793","https://openalex.org/W3102510044","https://openalex.org/W3113606433","https://openalex.org/W6637373629","https://openalex.org/W6638667902","https://openalex.org/W6719768283"],"related_works":["https://openalex.org/W3008068282","https://openalex.org/W2896161911","https://openalex.org/W2185658074","https://openalex.org/W4285245242","https://openalex.org/W2951921863","https://openalex.org/W1980136882","https://openalex.org/W1707075782","https://openalex.org/W1979830285","https://openalex.org/W3049130895","https://openalex.org/W2155643858"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,9,70,78,103],"near-data":[3],"processing":[4],"(NDP)":[5],"architecture":[6,26],"that":[7],"exploits":[8],"memory":[10,33,49],"expander":[11],"with":[12,65,109],"byte-addressable":[13],"memory-semantic":[14],"interconnect":[15],"to":[16],"accelerate":[17],"memory-bound":[18,54],"operations":[19,30,55,67,76],"in":[20],"deep":[21,96],"neural":[22],"networks":[23],"(DNNs).":[24],"Our":[25,99],"can":[27,61,84,101],"execute":[28],"NDP":[29,42,59,82],"on":[31,57,69],"the":[32,36,45,53,58,74,81,89],"traffic":[34],"from":[35],"GPU":[37],"on-the-fly":[38],"by":[39,88,95],"employing":[40],"bump-in-the-wire":[41],"logic":[43],"between":[44],"off-chip":[46],"link":[47],"and":[48],"controller.":[50],"In":[51],"addition,":[52],"executed":[56,68],"unit":[60],"be":[62,85],"effectively":[63],"overlapped":[64],"compute-intensive":[66],"GPU,":[71],"even":[72],"if":[73],"two":[75],"have":[77],"dependency.":[79],"Furthermore,":[80],"offloading":[83],"automatically":[86],"done":[87],"compiler":[90],"without":[91],"any":[92],"code":[93],"modification":[94],"learning":[97],"practitioners.":[98],"approach":[100],"achieve":[102],"51%":[104],"speedup":[105],"for":[106],"training":[107],"VGG-16":[108],"batch":[110],"normalization.":[111]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
