{"id":"https://openalex.org/W4312813449","doi":"https://doi.org/10.1109/iscas48785.2022.9937832","title":"Optimization of DRAM based PIM Architecture for Energy-Efficient Deep Neural Network Training","display_name":"Optimization of DRAM based PIM Architecture for Energy-Efficient Deep Neural Network Training","publication_year":2022,"publication_date":"2022-05-28","ids":{"openalex":"https://openalex.org/W4312813449","doi":"https://doi.org/10.1109/iscas48785.2022.9937832"},"language":"en","primary_location":{"id":"doi:10.1109/iscas48785.2022.9937832","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas48785.2022.9937832","pdf_url":null,"source":{"id":"https://openalex.org/S4363604393","display_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046990456","display_name":"Chirag Sudarshan","orcid":"https://orcid.org/0000-0002-1651-1935"},"institutions":[{"id":"https://openalex.org/I153267046","display_name":"University of Kaiserslautern","ror":"https://ror.org/04zrf7b53","country_code":"DE","type":"education","lineage":["https://openalex.org/I153267046"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Chirag Sudarshan","raw_affiliation_strings":["Technische Universit&#x00E4;t Kaiserslautern,Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t Kaiserslautern,Germany","institution_ids":["https://openalex.org/I153267046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003224930","display_name":"Mohammad Hassani Sadi","orcid":"https://orcid.org/0009-0009-6946-3330"},"institutions":[{"id":"https://openalex.org/I153267046","display_name":"University of Kaiserslautern","ror":"https://ror.org/04zrf7b53","country_code":"DE","type":"education","lineage":["https://openalex.org/I153267046"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Mohammad Hassani Sadi","raw_affiliation_strings":["Technische Universit&#x00E4;t Kaiserslautern,Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t Kaiserslautern,Germany","institution_ids":["https://openalex.org/I153267046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090870819","display_name":"Christian Weis","orcid":"https://orcid.org/0000-0002-4152-0200"},"institutions":[{"id":"https://openalex.org/I153267046","display_name":"University of Kaiserslautern","ror":"https://ror.org/04zrf7b53","country_code":"DE","type":"education","lineage":["https://openalex.org/I153267046"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christian Weis","raw_affiliation_strings":["Technische Universit&#x00E4;t Kaiserslautern,Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t Kaiserslautern,Germany","institution_ids":["https://openalex.org/I153267046"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059285190","display_name":"Norbert Wehn","orcid":"https://orcid.org/0000-0002-9010-086X"},"institutions":[{"id":"https://openalex.org/I153267046","display_name":"University of Kaiserslautern","ror":"https://ror.org/04zrf7b53","country_code":"DE","type":"education","lineage":["https://openalex.org/I153267046"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Norbert Wehn","raw_affiliation_strings":["Technische Universit&#x00E4;t Kaiserslautern,Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t Kaiserslautern,Germany","institution_ids":["https://openalex.org/I153267046"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5046990456"],"corresponding_institution_ids":["https://openalex.org/I153267046"],"apc_list":null,"apc_paid":null,"fwci":0.4797,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.7361329,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1472","last_page":"1476"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8108766078948975},{"id":"https://openalex.org/keywords/dram","display_name":"Dram","score":0.7847403287887573},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5679234862327576},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5196234583854675},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4368618130683899},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.4134064018726349},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.36419039964675903},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3519548773765564},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3495960533618927},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.34325551986694336},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.2692558169364929},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.14730101823806763},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11368528008460999},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11075916886329651}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8108766078948975},{"id":"https://openalex.org/C7366592","wikidata":"https://www.wikidata.org/wiki/Q1255620","display_name":"Dram","level":2,"score":0.7847403287887573},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5679234862327576},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5196234583854675},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4368618130683899},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.4134064018726349},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.36419039964675903},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3519548773765564},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3495960533618927},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.34325551986694336},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.2692558169364929},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.14730101823806763},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11368528008460999},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11075916886329651},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscas48785.2022.9937832","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas48785.2022.9937832","pdf_url":null,"source":{"id":"https://openalex.org/S4363604393","display_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.8999999761581421}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W2551176409","https://openalex.org/W2555826082","https://openalex.org/W2765234579","https://openalex.org/W2799613139","https://openalex.org/W2809205380","https://openalex.org/W2896090304","https://openalex.org/W2904200161","https://openalex.org/W2943178787","https://openalex.org/W2945287634","https://openalex.org/W2946829484","https://openalex.org/W2949989598","https://openalex.org/W2963809228","https://openalex.org/W2980688670","https://openalex.org/W2982008795","https://openalex.org/W2990844796","https://openalex.org/W3016021860","https://openalex.org/W3036878841","https://openalex.org/W3100639723","https://openalex.org/W3100710793","https://openalex.org/W3118608800","https://openalex.org/W3127930667","https://openalex.org/W3134274954","https://openalex.org/W3134703406","https://openalex.org/W3136402052","https://openalex.org/W3142170088","https://openalex.org/W3158634533","https://openalex.org/W4250482878","https://openalex.org/W6729971367","https://openalex.org/W6770699648","https://openalex.org/W6787972765"],"related_works":["https://openalex.org/W2292897598","https://openalex.org/W1764185321","https://openalex.org/W1997145140","https://openalex.org/W2056763347","https://openalex.org/W2034384303","https://openalex.org/W2901309973","https://openalex.org/W2044629287","https://openalex.org/W2619024801","https://openalex.org/W2127764549","https://openalex.org/W4280607449"],"abstract_inverted_index":{"Deep":[0],"Neural":[1],"Network":[2],"(DNN)":[3],"training":[4,65],"consumes":[5],"high-energy.":[6],"On":[7],"the":[8,32,37,56,67,78,82,96,115,121,127,141,153,166,173,189,218],"other":[9],"hand,":[10],"DNNs":[11],"deployed":[12],"on":[13],"edge":[14],"devices":[15],"demand":[16],"very":[17,102],"high-energy":[18],"efficiency.":[19],"In":[20],"this":[21],"context,":[22],"Processing-in-Memory":[23],"(PIM)":[24],"is":[25,66,111,181],"an":[26],"emerging":[27],"compute":[28],"paradigm":[29],"that":[30,138,192,216],"bridges":[31],"memory-computation":[33],"gap":[34],"to":[35,106,113,147,158,182,228],"improve":[36],"energy-efficiency.":[38],"DRAMs":[39],"are":[40],"one":[41],"such":[42],"memory":[43,79],"type":[44],"employed":[45],"for":[46,51,63,124],"designing":[47],"energy-efficient":[48],"PIM":[49,83,99],"architectures":[50,61,100],"DNN":[52,64],"training.":[53,177],"One":[54],"of":[55,59,70,130,162,165,197,221],"major":[57],"issues":[58],"DRAM-PIM":[60],"designed":[62],"high":[68,103,209],"number":[69,220],"internal":[71,92,116,142],"data":[72,93,117,143,155,163,202,222],"accesses":[73,94,161],"within":[74,120,188],"a":[75,184,207],"bank":[76,123,154,191],"between":[77],"arrays":[80],"and":[81,200,232],"computation":[84,107],"units":[85],"(e.g.":[86],"51%":[87],"more":[88],"than":[89],"inference).":[90],"These":[91],"in":[95],"state-of-the-art":[97],"DRAM":[98,122,190],"consume":[101],"energy":[104,119,128,145,224],"compared":[105,227],"units.":[108],"Hence,":[109],"it":[110],"important":[112],"reduce":[114,140],"access":[118,144,156,223],"further":[125],"improving":[126],"efficiency":[129],"DRAMPIM":[131],"architectures.":[132],"We":[133],"present":[134],"three":[135],"novel":[136],"optimizations":[137],"together":[139],"up":[146],"81.54%.":[148],"Our":[149],"first":[150],"optimization":[151,180],"modifies":[152],"circuit":[157],"enable":[159],"partial":[160],"instead":[164],"conventional":[167],"fixed":[168],"granularity":[169],"accesses,":[170],"thereby":[171],"exploiting":[172],"available":[174],"sparsity":[175],"during":[176],"The":[178],"second":[179],"have":[183],"dedicated":[185],"low-energy":[186],"region":[187],"has":[193],"low":[194],"capacitive":[195],"load":[196],"global":[198],"wires":[199],"shorter":[201],"movement.":[203],"Finally,":[204],"we":[205],"propose":[206],"12-bit":[208],"dynamic":[210],"range":[211],"floating-point":[212],"format":[213],"called":[214],"TinyFloat":[215],"reduces":[217],"total":[219],"by":[225],"20%":[226],"IEEE":[229],"754":[230],"half":[231],"single":[233],"precision.":[234]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
