{"id":"https://openalex.org/W3174762441","doi":"https://doi.org/10.1145/3460971","title":"High-throughput Near-Memory Processing on CNNs with 3D HBM-like Memory","display_name":"High-throughput Near-Memory Processing on CNNs with 3D HBM-like Memory","publication_year":2021,"publication_date":"2021-06-28","ids":{"openalex":"https://openalex.org/W3174762441","doi":"https://doi.org/10.1145/3460971","mag":"3174762441"},"language":"en","primary_location":{"id":"doi:10.1145/3460971","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3460971","pdf_url":null,"source":{"id":"https://openalex.org/S105046310","display_name":"ACM Transactions on Design Automation of Electronic Systems","issn_l":"1084-4309","issn":["1084-4309","1557-7309"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Design Automation of Electronic Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019501792","display_name":"Naebeom Park","orcid":"https://orcid.org/0000-0003-0947-9145"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Naebeom Park","raw_affiliation_strings":["Pohang University of Science and Technology, Pohang"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology, Pohang","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079596428","display_name":"Sungju Ryu","orcid":"https://orcid.org/0000-0002-0254-391X"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sungju Ryu","raw_affiliation_strings":["Pohang University of Science and Technology, Pohang"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology, Pohang","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079872127","display_name":"Jaeha Kung","orcid":"https://orcid.org/0000-0001-6151-8602"},"institutions":[{"id":"https://openalex.org/I193352282","display_name":"Daegu Gyeongbuk Institute of Science and Technology","ror":"https://ror.org/03frjya69","country_code":"KR","type":"education","lineage":["https://openalex.org/I193352282"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaeha Kung","raw_affiliation_strings":["DGIST, Daegu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DGIST, Daegu","institution_ids":["https://openalex.org/I193352282"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003219699","display_name":"Jae\u2010Joon Kim","orcid":"https://orcid.org/0000-0001-5175-8258"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jae-Joon Kim","raw_affiliation_strings":["Pohang University of Science and Technology, Pohang"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology, Pohang","institution_ids":["https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.2204,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.78729654,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"26","issue":"6","first_page":"1","last_page":"20"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8888775706291199},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.7008936405181885},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.46679219603538513},{"id":"https://openalex.org/keywords/registered-memory","display_name":"Registered memory","score":0.4509182274341583},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.4382655620574951},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.4343092441558838},{"id":"https://openalex.org/keywords/computer-memory","display_name":"Computer memory","score":0.4207392930984497},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.41032516956329346},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.37222325801849365},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.35403603315353394},{"id":"https://openalex.org/keywords/semiconductor-memory","display_name":"Semiconductor memory","score":0.3143951892852783},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.1273777186870575},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.08048474788665771}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8888775706291199},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.7008936405181885},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.46679219603538513},{"id":"https://openalex.org/C93446704","wikidata":"https://www.wikidata.org/wiki/Q449328","display_name":"Registered memory","level":3,"score":0.4509182274341583},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.4382655620574951},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.4343092441558838},{"id":"https://openalex.org/C92855701","wikidata":"https://www.wikidata.org/wiki/Q5830907","display_name":"Computer memory","level":3,"score":0.4207392930984497},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.41032516956329346},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.37222325801849365},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.35403603315353394},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.3143951892852783},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.1273777186870575},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.08048474788665771},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3460971","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3460971","pdf_url":null,"source":{"id":"https://openalex.org/S105046310","display_name":"ACM Transactions on Design Automation of Electronic Systems","issn_l":"1084-4309","issn":["1084-4309","1557-7309"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Design Automation of Electronic Systems","raw_type":"journal-article"},{"id":"pmh:oai:oasis.postech.ac.kr:2014.oak/110870","is_oa":false,"landing_page_url":"https://oasis.postech.ac.kr/handle/2014.oak/110870","pdf_url":null,"source":{"id":"https://openalex.org/S4306401965","display_name":"Open Access System for Information Sharing (Pohang University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I123900574","host_organization_name":"Pohang University of Science and Technology","host_organization_lineage":["https://openalex.org/I123900574"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.9100000262260437}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1487583988","https://openalex.org/W1981220134","https://openalex.org/W2048266589","https://openalex.org/W2094756095","https://openalex.org/W2108598243","https://openalex.org/W2133834148","https://openalex.org/W2194775991","https://openalex.org/W2257979135","https://openalex.org/W2285660444","https://openalex.org/W2289252105","https://openalex.org/W2474451066","https://openalex.org/W2518511512","https://openalex.org/W2520782513","https://openalex.org/W2575705757","https://openalex.org/W2582737986","https://openalex.org/W2585720638","https://openalex.org/W2593564159","https://openalex.org/W2604319603","https://openalex.org/W2606722458","https://openalex.org/W2742947407","https://openalex.org/W2761132374","https://openalex.org/W2769856846","https://openalex.org/W2790546557","https://openalex.org/W2921918777","https://openalex.org/W2953212265","https://openalex.org/W2964988320","https://openalex.org/W2982083293","https://openalex.org/W3105314253","https://openalex.org/W4244457258","https://openalex.org/W4246587277"],"related_works":["https://openalex.org/W4242495027","https://openalex.org/W2898989424","https://openalex.org/W4293159259","https://openalex.org/W2019238062","https://openalex.org/W4285257158","https://openalex.org/W2354036839","https://openalex.org/W4238754064","https://openalex.org/W2100773763","https://openalex.org/W2561005478","https://openalex.org/W2136268150"],"abstract_inverted_index":{"This":[0],"article":[1],"discusses":[2],"the":[3,12,27,37,48,64,68,76,93,97,107,114,119,135,148,152,159],"high-performance":[4],"near-memory":[5,32,58],"neural":[6],"network":[7],"(NN)":[8],"accelerator":[9,34,60],"architecture":[10],"utilizing":[11],"logic":[13],"die":[14],"in":[15,55,125],"three-dimensional":[16],"(3D)":[17],"High":[18],"Bandwidth":[19],"Memory\u2013":[20],"(HBM)":[21],"like":[22],"memory.":[23],"As":[24],"most":[25],"of":[26,57,63,113,134],"previously":[28],"reported":[29],"3D":[30,70],"memory-based":[31],"NN":[33,59],"designs":[35,124],"used":[36],"Hybrid":[38],"Memory":[39],"Cube":[40],"(HMC)":[41],"memory,":[42],"we":[43,95],"first":[44],"focus":[45],"on":[46,92,156,164],"identifying":[47],"key":[49],"differences":[50,66],"between":[51,67],"HBM":[52,74],"and":[53,101,131,158],"HMC":[54,83],"terms":[56],"design.":[61],"One":[62],"major":[65],"two":[69],"memories":[71],"is":[72],"that":[73,147],"has":[75,84],"centralized":[77,108],"through-":[78],"silicon-via":[79],"(TSV)":[80],"channels":[81,87,110],"while":[82],"distributed":[85],"TSV":[86,109],"for":[88,111,118],"separate":[89],"vaults.":[90],"Based":[91],"observation,":[94],"introduce":[96],"Round-Robin":[98],"Data":[99],"Fetching":[100],"Groupwise":[102],"Broadcast":[103],"schemes":[104,150],"to":[105,167],"exploit":[106],"improvement":[112],"data":[115,169],"feeding":[116],"rate":[117],"processing":[120],"elements.":[121],"Using":[122],"synthesized":[123],"a":[126],"28-nm":[127],"CMOS":[128],"technology,":[129],"performance":[130],"energy":[132,160],"consumption":[133,161],"proposed":[136,149],"architectures":[137],"with":[138],"various":[139],"dataflow":[140],"models":[141],"are":[142],"evaluated.":[143],"Experimental":[144],"results":[145],"show":[146],"reduce":[151],"runtime":[153],"by":[154,162],"16.4\u201339.3%":[155],"average":[157,165],"2.1\u20135.1%":[163],"compared":[166],"conventional":[168],"fetching":[170],"schemes.":[171]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
