{"id":"https://openalex.org/W2920081941","doi":"https://doi.org/10.1109/tc.2019.2903055","title":"NNPIM: A Processing In-Memory Architecture for Neural Network Acceleration","display_name":"NNPIM: A Processing In-Memory Architecture for Neural Network Acceleration","publication_year":2019,"publication_date":"2019-03-04","ids":{"openalex":"https://openalex.org/W2920081941","doi":"https://doi.org/10.1109/tc.2019.2903055","mag":"2920081941"},"language":"en","primary_location":{"id":"doi:10.1109/tc.2019.2903055","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2019.2903055","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079372283","display_name":"Saransh Gupta","orcid":"https://orcid.org/0000-0001-5814-3934"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Saransh Gupta","raw_affiliation_strings":["Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033221192","display_name":"Mohsen Imani","orcid":"https://orcid.org/0000-0002-5761-0622"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohsen Imani","raw_affiliation_strings":["Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066054463","display_name":"Harveen Kaur","orcid":"https://orcid.org/0000-0002-6264-7585"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Harveen Kaur","raw_affiliation_strings":["Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025573294","display_name":"Tajana Rosing","orcid":"https://orcid.org/0000-0002-6954-997X"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tajana Simunic Rosing","raw_affiliation_strings":["Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of California San Diego, La Jolla, CA, USA","institution_ids":["https://openalex.org/I36258959"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5079372283"],"corresponding_institution_ids":["https://openalex.org/I36258959"],"apc_list":null,"apc_paid":null,"fwci":3.2699,"has_fulltext":false,"cited_by_count":55,"citation_normalized_percentile":{"value":0.93843868,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"68","issue":"9","first_page":"1325","last_page":"1337"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8729669451713562},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6876270771026611},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6186299324035645},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5894879102706909},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5772252082824707},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5476006269454956},{"id":"https://openalex.org/keywords/crossbar-switch","display_name":"Crossbar switch","score":0.5061630606651306},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.4837805926799774},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.47193214297294617},{"id":"https://openalex.org/keywords/computing-with-memory","display_name":"Computing with Memory","score":0.4603900611400604},{"id":"https://openalex.org/keywords/in-memory-processing","display_name":"In-Memory Processing","score":0.45104384422302246},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.4272826015949249},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4266183078289032},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.41977664828300476},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4171045422554016},{"id":"https://openalex.org/keywords/memory-architecture","display_name":"Memory architecture","score":0.4134156405925751},{"id":"https://openalex.org/keywords/uniform-memory-access","display_name":"Uniform memory access","score":0.4091712236404419},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.36909741163253784},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.3582504391670227},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2715602517127991},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.2683892250061035},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.26444149017333984},{"id":"https://openalex.org/keywords/semiconductor-memory","display_name":"Semiconductor memory","score":0.18569394946098328},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.1258317530155182},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10853496193885803}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8729669451713562},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6876270771026611},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6186299324035645},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5894879102706909},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5772252082824707},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5476006269454956},{"id":"https://openalex.org/C29984679","wikidata":"https://www.wikidata.org/wiki/Q1929149","display_name":"Crossbar switch","level":2,"score":0.5061630606651306},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.4837805926799774},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.47193214297294617},{"id":"https://openalex.org/C152890283","wikidata":"https://www.wikidata.org/wiki/Q4129922","display_name":"Computing with Memory","level":5,"score":0.4603900611400604},{"id":"https://openalex.org/C123593499","wikidata":"https://www.wikidata.org/wiki/Q6008583","display_name":"In-Memory Processing","level":5,"score":0.45104384422302246},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.4272826015949249},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4266183078289032},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41977664828300476},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4171045422554016},{"id":"https://openalex.org/C2779602883","wikidata":"https://www.wikidata.org/wiki/Q15544750","display_name":"Memory architecture","level":2,"score":0.4134156405925751},{"id":"https://openalex.org/C51290061","wikidata":"https://www.wikidata.org/wiki/Q1936765","display_name":"Uniform memory access","level":4,"score":0.4091712236404419},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.36909741163253784},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.3582504391670227},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2715602517127991},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.2683892250061035},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.26444149017333984},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.18569394946098328},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.1258317530155182},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10853496193885803},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.0},{"id":"https://openalex.org/C194222762","wikidata":"https://www.wikidata.org/wiki/Q114486","display_name":"Query by Example","level":4,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tc.2019.2903055","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2019.2903055","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G1392834322","display_name":null,"funder_award_id":"#1730158","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"},{"id":"https://openalex.org/G6628366097","display_name":null,"funder_award_id":"#1527034","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"}],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320335353","display_name":"National Science Foundation of Sri Lanka","ror":"https://ror.org/010xaa060"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":66,"referenced_works":["https://openalex.org/W104184427","https://openalex.org/W179875071","https://openalex.org/W1578783943","https://openalex.org/W1686810756","https://openalex.org/W1981943579","https://openalex.org/W1986644367","https://openalex.org/W2048266589","https://openalex.org/W2061071837","https://openalex.org/W2081729575","https://openalex.org/W2094756095","https://openalex.org/W2095705004","https://openalex.org/W2097117768","https://openalex.org/W2101234009","https://openalex.org/W2103496339","https://openalex.org/W2105103777","https://openalex.org/W2119144962","https://openalex.org/W2129868601","https://openalex.org/W2134264591","https://openalex.org/W2148461049","https://openalex.org/W2152839228","https://openalex.org/W2155377787","https://openalex.org/W2163605009","https://openalex.org/W2285660444","https://openalex.org/W2300242332","https://openalex.org/W2396622873","https://openalex.org/W2402144811","https://openalex.org/W2407339173","https://openalex.org/W2508602506","https://openalex.org/W2513554817","https://openalex.org/W2518281301","https://openalex.org/W2551814622","https://openalex.org/W2562773490","https://openalex.org/W2588236721","https://openalex.org/W2613989746","https://openalex.org/W2625133503","https://openalex.org/W2625840880","https://openalex.org/W2725615981","https://openalex.org/W2744849844","https://openalex.org/W2790344283","https://openalex.org/W2799257450","https://openalex.org/W2807837291","https://openalex.org/W2809171749","https://openalex.org/W2891489843","https://openalex.org/W2900379535","https://openalex.org/W2953384591","https://openalex.org/W2964299589","https://openalex.org/W3005783121","https://openalex.org/W3121517425","https://openalex.org/W3145511514","https://openalex.org/W4212788319","https://openalex.org/W4242577057","https://openalex.org/W4319156734","https://openalex.org/W6604254268","https://openalex.org/W6607333740","https://openalex.org/W6637373629","https://openalex.org/W6674330103","https://openalex.org/W6675354045","https://openalex.org/W6677580257","https://openalex.org/W6680105153","https://openalex.org/W6681813608","https://openalex.org/W6684191040","https://openalex.org/W6712770252","https://openalex.org/W6713134421","https://openalex.org/W6751953977","https://openalex.org/W6754557550","https://openalex.org/W6789476068"],"related_works":["https://openalex.org/W3180803030","https://openalex.org/W2168550483","https://openalex.org/W4225739994","https://openalex.org/W4321062910","https://openalex.org/W2143690511","https://openalex.org/W1970751325","https://openalex.org/W2942841750","https://openalex.org/W3163143851","https://openalex.org/W2993507867","https://openalex.org/W3025845664"],"abstract_inverted_index":{"Neural":[0],"networks":[1],"(NNs)":[2],"have":[3,33],"shown":[4],"great":[5],"ability":[6],"to":[7,27,36,149,195,202],"process":[8],"emerging":[9],"applications":[10],"such":[11],"as":[12,193],"speech":[13],"recognition,":[14,16],"language":[15],"image":[17],"classification,":[18],"video":[19],"segmentation,":[20],"and":[21,46,57,106,123,157,172,189,217],"gaming.":[22],"It":[23],"is":[24,49,190,218],"therefore":[25],"important":[26],"make":[28],"NNs":[29,65],"efficient.":[30],"Although":[31],"attempts":[32],"been":[34],"made":[35],"improve":[37,141],"NNs'":[38,54,121],"computation":[39],"cost,":[40],"the":[41,50,62,92,110,125,142,151,164,173,223],"data":[42],"movement":[43],"between":[44],"memory":[45,99,156],"processing":[47,79],"cores":[48],"main":[51],"bottleneck":[52],"for":[53],"energy":[55,127,187,215],"consumption":[56],"execution":[58],"time.":[59],"This":[60],"makes":[61],"implementation":[63],"of":[64,153,166],"significantly":[66,85,119],"slower":[67],"on":[68,210],"traditional":[69],"CPU/GPU":[70],"cores.":[71],"In":[72],"this":[73],"paper,":[74],"we":[75,95,113],"propose":[76],"a":[77,97],"novel":[78],"in-memory":[80,137],"architecture,":[81],"called":[82],"NNPIM,":[83],"that":[84,101,180],"accelerates":[86],"neural":[87,204],"network's":[88],"inference":[89],"phase":[90],"inside":[91,109],"memory.":[93,111],"First,":[94],"design":[96,145,182],"crossbar":[98],"architecture":[100],"supports":[102,146],"fast":[103],"addition,":[104],"multiplication,":[105],"search":[107],"operations":[108],"Second,":[112],"introduce":[114],"simple":[115],"optimization":[116],"techniques":[117],"which":[118],"improves":[120],"performance":[122],"reduces":[124],"overall":[126],"consumption.":[128],"We":[129,162],"also":[130],"map":[131],"all":[132],"NN":[133],"functionalities":[134],"using":[135],"parallel":[136],"components.":[138],"To":[139],"further":[140],"efficiency,":[143],"our":[144,167,181],"weight":[147],"sharing":[148],"reduce":[150],"number":[152],"computations":[154],"in":[155],"consecutively":[158],"speedup":[159],"NNPIM":[160,169,207],"computation.":[161],"compare":[163],"efficiency":[165,188,216],"proposed":[168],"with":[170],"GPU":[171,199],"state-of-the-art":[174,203],"PIM":[175],"architectures.":[176],"Our":[177],"evaluation":[178],"shows":[179],"can":[183,208],"achieve":[184,209],"131.5\u00d7":[185],"higher":[186,214],"48.2\u00d7":[191],"faster":[192],"compared":[194],"NVIDIA":[196],"GTX":[197],"1,080":[198],"architecture.":[200],"Compared":[201],"network":[205],"accelerators,":[206],"an":[211],"average":[212],"3.6\u00d7":[213],"4.6\u00d7":[219],"faster,":[220],"while":[221],"providing":[222],"same":[224],"classification":[225],"accuracy.":[226]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":5}],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2025-10-10T00:00:00"}
