{"id":"https://openalex.org/W4392642233","doi":"https://doi.org/10.1109/tcsii.2024.3374725","title":"A 8.81 TFLOPS/W Deep-Reinforcement-Learning Accelerator With Delta-Based Weight Sharing and Block-Mantissa Reconfigurable PE Array","display_name":"A 8.81 TFLOPS/W Deep-Reinforcement-Learning Accelerator With Delta-Based Weight Sharing and Block-Mantissa Reconfigurable PE Array","publication_year":2024,"publication_date":"2024-03-11","ids":{"openalex":"https://openalex.org/W4392642233","doi":"https://doi.org/10.1109/tcsii.2024.3374725"},"language":"en","primary_location":{"id":"doi:10.1109/tcsii.2024.3374725","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsii.2024.3374725","pdf_url":null,"source":{"id":"https://openalex.org/S93916849","display_name":"IEEE Transactions on Circuits & Systems II Express Briefs","issn_l":"1549-7747","issn":["1549-7747","1558-3791"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems II: Express Briefs","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094113899","display_name":"Sanghyuk An","orcid":"https://orcid.org/0009-0007-1219-3128"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Sanghyuk An","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","School of Electrical Engineering, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]},{"raw_affiliation_string":"School of Electrical Engineering, Korea","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027286037","display_name":"Junha Ryu","orcid":"https://orcid.org/0000-0001-8147-3085"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Junha Ryu","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","School of Electrical Engineering, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]},{"raw_affiliation_string":"School of Electrical Engineering, Korea","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029169930","display_name":"Gwangtae Park","orcid":"https://orcid.org/0000-0002-9132-0311"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Gwangtae Park","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","School of Electrical Engineering, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]},{"raw_affiliation_string":"School of Electrical Engineering, Korea","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077896259","display_name":"Hoi\u2010Jun Yoo","orcid":"https://orcid.org/0000-0002-6661-4879"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hoi-Jun Yoo","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","School of Electrical Engineering, Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology, Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]},{"raw_affiliation_string":"School of Electrical Engineering, Korea","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5094113899"],"corresponding_institution_ids":["https://openalex.org/I157485424"],"apc_list":null,"apc_paid":null,"fwci":0.7252,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72936664,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"71","issue":"5","first_page":"2529","last_page":"2533"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11522","display_name":"VLSI and FPGA Design Techniques","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6637018918991089},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5028755068778992},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.46953001618385315},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.4606175124645233},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4227806329727173},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.41620680689811707},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.39485910534858704},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1923905313014984},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.18252667784690857},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.15080904960632324},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.12514260411262512},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.12129044532775879},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11944633722305298},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10956600308418274}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6637018918991089},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5028755068778992},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.46953001618385315},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.4606175124645233},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4227806329727173},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.41620680689811707},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.39485910534858704},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1923905313014984},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.18252667784690857},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.15080904960632324},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.12514260411262512},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.12129044532775879},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11944633722305298},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10956600308418274},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsii.2024.3374725","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsii.2024.3374725","pdf_url":null,"source":{"id":"https://openalex.org/S93916849","display_name":"IEEE Transactions on Circuits & Systems II Express Briefs","issn_l":"1549-7747","issn":["1549-7747","1558-3791"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems II: Express Briefs","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5711625785","display_name":null,"funder_award_id":"2021-0-00871","funder_id":"https://openalex.org/F4320335489","funder_display_name":"Institute for Information and Communications Technology Promotion"}],"funders":[{"id":"https://openalex.org/F4320335489","display_name":"Institute for Information and Communications Technology Promotion","ror":"https://ror.org/01g0hqq23"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W2899063892","https://openalex.org/W2907537824","https://openalex.org/W2920954974","https://openalex.org/W2968983352","https://openalex.org/W2982316857","https://openalex.org/W3088811935","https://openalex.org/W3162607076","https://openalex.org/W4205825342","https://openalex.org/W6748839928","https://openalex.org/W6756007670","https://openalex.org/W6786275528"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W2964765435"],"abstract_inverted_index":{"TD3":[0],"is":[1],"one":[2],"of":[3,74,139,150],"the":[4,49,132],"most":[5],"high-performing":[6],"Deep":[7],"Reinforcement":[8],"Learning":[9],"(DRL)":[10],"algorithms,":[11],"providing":[12],"high":[13,27],"training":[14],"stability":[15],"and":[16,32,40,44,66,81,86,101],"rewards.":[17],"However,":[18],"it":[19,145],"suffers":[20],"from":[21],"low":[22],"energy":[23,45,148],"efficiency":[24,149],"due":[25],"to":[26,71,76,103,113],"External":[28],"Memory":[29],"Access":[30],"(EMA)":[31],"floating":[33],"point":[34],"operations.":[35],"To":[36],"mitigate":[37],"this":[38],"issue":[39],"achieve":[41],"higher":[42],"throughput":[43],"efficiency,":[46],"we":[47],"propose":[48],"DRL":[50],"accelerator":[51],"with":[52,134,143],"3":[53],"features:":[54],"1)":[55],"Delta-based":[56],"Weight":[57],"Sharing":[58],"(DWS)":[59],"represents":[60],"weights":[61],"by":[62],"referencing":[63],"corresponding":[64],"network":[65],"exploits":[67],"data":[68,128],"locality,":[69],"leading":[70],"EMA":[72],"reduction":[73],"up":[75,112],"64.3%":[77],"in":[78,83,99,111,117],"feed-forward":[79],"stage":[80],"39.7%":[82],"gradient":[84],"generation":[85],"weight":[87],"update":[88],"stage.":[89],"2)":[90],"Block-Mantissa":[91],"Reconfigurable":[92],"PE":[93],"Array":[94],"(BMRPA)":[95],"supports":[96,124],"variable":[97],"operations":[98],"blocks":[100],"mantissa":[102],"provide":[104],"optimal":[105],"precision":[106],"for":[107],"each":[108],"layer,":[109],"resulting":[110],"a":[114],"4\u00d7":[115],"increase":[116],"throughput.":[118],"3)":[119],"Multi-mode":[120],"Data":[121],"Fetcher":[122],"(MDF)":[123],"bit":[125],"width":[126],"adaptive":[127],"fetching,":[129],"achieving":[130],"twice":[131],"bandwidth":[133],"an":[135,147],"average":[136],"read":[137],"overhead":[138],"5.3%.":[140],"When":[141],"combined":[142],"BMRPA,":[144],"attains":[146],"8.81":[151],"TFLOPS/W.":[152]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
