{"id":"https://openalex.org/W4318685379","doi":"https://doi.org/10.1145/3566097.3567857","title":"An Efficient near-Bank Processing Architecture for Personalized Recommendation System","display_name":"An Efficient near-Bank Processing Architecture for Personalized Recommendation System","publication_year":2023,"publication_date":"2023-01-16","ids":{"openalex":"https://openalex.org/W4318685379","doi":"https://doi.org/10.1145/3566097.3567857"},"language":"en","primary_location":{"id":"doi:10.1145/3566097.3567857","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3566097.3567857","pdf_url":null,"source":{"id":"https://openalex.org/S4363608968","display_name":"Proceedings of the 28th Asia and South Pacific Design Automation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th Asia and South Pacific Design Automation Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101421201","display_name":"Yuqing Yang","orcid":"https://orcid.org/0000-0003-3518-5212"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuqing Yang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103222478","display_name":"Weidong Yang","orcid":"https://orcid.org/0000-0003-3610-2343"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weidong Yang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100725058","display_name":"Qin Wang","orcid":"https://orcid.org/0000-0001-7081-6580"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qin Wang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045693138","display_name":"Naifeng Jing","orcid":"https://orcid.org/0000-0001-8417-5796"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Naifeng Jing","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008057183","display_name":"Jianfei Jiang","orcid":"https://orcid.org/0000-0002-5521-6197"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianfei Jiang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103236320","display_name":"Zhigang Mao","orcid":"https://orcid.org/0000-0001-9431-9853"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhigang Mao","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043703962","display_name":"Weiguang Sheng","orcid":"https://orcid.org/0000-0002-7831-526X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiguang Sheng","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101421201"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05797101,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"122","last_page":"127"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dram","display_name":"Dram","score":0.8060588836669922},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.79981929063797},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6958012580871582},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.6667901277542114},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.6150894165039062},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5759793519973755},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5458014011383057},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.5205736756324768},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4916704297065735},{"id":"https://openalex.org/keywords/memory-architecture","display_name":"Memory architecture","score":0.4690416753292084},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.45860323309898376},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.40426284074783325},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.2950761914253235},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.13270464539527893},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.07178592681884766}],"concepts":[{"id":"https://openalex.org/C7366592","wikidata":"https://www.wikidata.org/wiki/Q1255620","display_name":"Dram","level":2,"score":0.8060588836669922},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79981929063797},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6958012580871582},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.6667901277542114},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.6150894165039062},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5759793519973755},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5458014011383057},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.5205736756324768},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4916704297065735},{"id":"https://openalex.org/C2779602883","wikidata":"https://www.wikidata.org/wiki/Q15544750","display_name":"Memory architecture","level":2,"score":0.4690416753292084},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.45860323309898376},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.40426284074783325},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.2950761914253235},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.13270464539527893},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.07178592681884766},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3566097.3567857","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3566097.3567857","pdf_url":null,"source":{"id":"https://openalex.org/S4363608968","display_name":"Proceedings of the 28th Asia and South Pacific Design Automation Conference","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th Asia and South Pacific Design Automation Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8799999952316284,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1981943579","https://openalex.org/W2034861439","https://openalex.org/W2040367556","https://openalex.org/W2086112773","https://openalex.org/W2518511512","https://openalex.org/W2979719709","https://openalex.org/W2985229340","https://openalex.org/W3016842236","https://openalex.org/W3042598257","https://openalex.org/W3043023836","https://openalex.org/W3187188899"],"related_works":["https://openalex.org/W2891987081","https://openalex.org/W4376647684","https://openalex.org/W4205208341","https://openalex.org/W2106019019","https://openalex.org/W2543610639","https://openalex.org/W2128337014","https://openalex.org/W2993780376","https://openalex.org/W2978553361","https://openalex.org/W2909135646","https://openalex.org/W2121559452"],"abstract_inverted_index":{"Personalized":[0],"recommendation":[1,28,56,97,175],"systems":[2],"consume":[3],"the":[4,25,32,55,60,69,101,110,117,147,170],"major":[5],"resources":[6],"in":[7,65,84],"modern":[8],"AI":[9],"data":[10,167],"centers.":[11],"The":[12],"memory-bound":[13],"embedding":[14,81,135],"layers":[15,82,136],"with":[16],"irregular":[17],"memory":[18,33,104],"access":[19],"patterns":[20],"have":[21],"been":[22],"identified":[23],"as":[24],"bottleneck":[26],"of":[27,80,109,149],"systems.":[29],"To":[30],"overcome":[31],"challenges,":[34],"near-memory":[35],"processing":[36,93],"(NMP)":[37],"would":[38],"be":[39],"an":[40,50,141],"effective":[41],"solution":[42,173],"which":[43,121],"provides":[44],"high":[45],"bandwidth.":[46,127,151],"Recent":[47],"work":[48],"proposes":[49],"NMP":[51,172],"approach":[52],"to":[53,95,145,159],"accelerate":[54,96],"models":[57],"by":[58,73],"utilizing":[59],"through-silicon":[61],"via":[62],"(TSV)":[63],"bandwidth":[64,71,120],"3D-stacked":[66,111,179],"DRAMs.":[67],"However,":[68],"total":[70],"provided":[72],"TSVs":[74],"is":[75,122],"insufficient":[76],"for":[77,134,166,174],"a":[78,91,131,153],"batch":[79],"processed":[83],"parallel.":[85],"In":[86],"this":[87],"paper,":[88],"we":[89,139],"propose":[90,140],"near-bank":[92],"architecture":[94,114,156],"models.":[98],"By":[99],"integrating":[100],"compute-logic":[102],"near":[103],"banks":[105],"on":[106,178],"DRAM":[107],"dies":[108],"DRAM,":[112],"our":[113,155],"can":[115],"exploit":[116],"enormous":[118],"bank-level":[119,150],"much":[123],"higher":[124],"than":[125],"TSV":[126],"We":[128],"also":[129],"present":[130],"hardware/software":[132],"interface":[133],"offloading.":[137],"Moreover,":[138],"efficient":[142],"mapping":[143],"scheme":[144],"enhance":[146],"utilization":[148],"As":[152],"result,":[154],"achieves":[157],"up":[158],"2.10X":[160],"speedup":[161],"and":[162],"31%":[163],"energy":[164],"saving":[165],"movement":[168],"over":[169],"state-of-the-art":[171],"acceleration":[176],"based":[177],"memory.":[180]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
