{"id":"https://openalex.org/W4285225262","doi":"https://doi.org/10.1109/tc.2022.3184272","title":"DyNNamic: Dynamically Reshaping, High Data-Reuse Accelerator for Compact DNNs","display_name":"DyNNamic: Dynamically Reshaping, High Data-Reuse Accelerator for Compact DNNs","publication_year":2023,"publication_date":"2023-03-01","ids":{"openalex":"https://openalex.org/W4285225262","doi":"https://doi.org/10.1109/tc.2022.3184272"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2022.3184272","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["1557-9956","2326-3814","0018-9340"],"is_oa":false,"is_in_doaj":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074284629","display_name":"Edward Hanson","orcid":"https://orcid.org/0000-0001-5179-8401"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Edward Hanson","raw_affiliation_string":"Electrical and Computer Engineering, Duke University, Durham, NC, USA","raw_affiliation_strings":["Electrical and Computer Engineering, Duke University, Durham, NC, USA"]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066123079","display_name":"Shiyu Li","orcid":"https://orcid.org/0000-0002-1990-7150"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shiyu Li","raw_affiliation_string":"Electrical and Computer Engineering, Duke University, Durham, NC, USA","raw_affiliation_strings":["Electrical and Computer Engineering, Duke University, Durham, NC, USA"]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047215143","display_name":"Xuehai Qian","orcid":null},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuehai Qian","raw_affiliation_string":"Ming Hsieh Department of Electrical Engineering, University of Southern California, Los Angeles, CA, USA","raw_affiliation_strings":["Ming Hsieh Department of Electrical Engineering, University of Southern California, Los Angeles, CA, USA"]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075474462","display_name":"Hai Li","orcid":"https://orcid.org/0000-0003-3228-6544"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hai Helen Li","raw_affiliation_string":"Electrical and Computer Engineering, Duke University, Durham, NC, USA","raw_affiliation_strings":["Electrical and Computer Engineering, Duke University, Durham, NC, USA"]},{"author_position":"last","author":{"id":"https://openalex.org/A5058073627","display_name":"Yiran Chen","orcid":"https://orcid.org/0000-0002-1486-8412"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiran Chen","raw_affiliation_string":"Electrical and Computer Engineering, Duke University, Durham, NC, USA","raw_affiliation_strings":["Electrical and Computer Engineering, Duke University, Durham, NC, USA"]}],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"has_fulltext":false,"cited_by_count":0,"cited_by_percentile_year":{"min":0,"max":82},"biblio":{"volume":"72","issue":"3","first_page":"880","last_page":"892"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Deep Learning in Computer Vision and Image Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Deep Learning in Computer Vision and Image Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Deep Learning Models","score":0.9967,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Advances in Transfer Learning and Domain Adaptation","score":0.9929,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"keyword":"dynamically reshaping","score":0.3325},{"keyword":"data-reuse","score":0.25}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.74396557},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.57132894},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.54666746},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.53884053},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.51456946},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.50428855},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.49776366},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.49055547},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4902623},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.45833403},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3615206},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33770847},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32852167},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.30338866},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.22152135},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18116343},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14236331},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2022.3184272","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["1557-9956","2326-3814","0018-9340"],"is_oa":false,"is_in_doaj":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.91}],"grants":[{"funder":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka","award_id":"1955246"},{"funder":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka","award_id":"1937435"}],"referenced_works_count":20,"referenced_works":["https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W2289252105","https://openalex.org/W2531409750","https://openalex.org/W2588191434","https://openalex.org/W2623629680","https://openalex.org/W2625457103","https://openalex.org/W2900228909","https://openalex.org/W2909419460","https://openalex.org/W2928560789","https://openalex.org/W2940862705","https://openalex.org/W2945146780","https://openalex.org/W2953212265","https://openalex.org/W2963163009","https://openalex.org/W2963844898","https://openalex.org/W2979439447","https://openalex.org/W3092319711","https://openalex.org/W4240168186","https://openalex.org/W4253012315","https://openalex.org/W4255951808"],"related_works":["https://openalex.org/W4319952061","https://openalex.org/W4280636456","https://openalex.org/W4388913998","https://openalex.org/W4310584535","https://openalex.org/W4295935044","https://openalex.org/W3159906349","https://openalex.org/W2000444236","https://openalex.org/W2384475851","https://openalex.org/W2353602216","https://openalex.org/W2367078749"],"ngrams_url":"https://api.openalex.org/works/W4285225262/ngrams","abstract_inverted_index":{"Convolutional":[0],"layers":[1,38],"dominate":[2],"the":[3,116,146,149,159],"computation":[4],"and":[5,26,44,55,81,127,177,190,198],"energy":[6,56,197],"costs":[7],"of":[8,36,78,85,88,195],"Deep":[9],"Neural":[10],"Network":[11],"(DNN)":[12],"inference.":[13],"Recent":[14],"algorithmic":[15],"works":[16],"attempt":[17],"to":[18,39,67,75,114,143,148],"reduce":[19,40],"these":[20,59,94],"bottlenecks":[21],"via":[22],"compact":[23,89,121],"DNN":[24,90],"structures":[25],"model":[27],"compression.":[28],"Likewise,":[29],"state-of-the-art":[30,180],"accelerator":[31],"designs":[32],"leverage":[33],"spatiotemporal":[34],"characteristics":[35],"convolutional":[37],"data":[41,164],"movement":[42,165],"overhead":[43],"improve":[45],"throughput.":[46],"Although":[47],"both":[48,132],"are":[49],"independently":[50],"effective":[51],"at":[52],"reducing":[53,163],"latency":[54],"costs,":[57],"combining":[58],"approaches":[60],"does":[61],"not":[62],"guarantee":[63],"cumulative":[64],"improvements":[65],"due":[66],"inefficient":[68],"mapping.":[69],"This":[70],"inefficiency":[71],"can":[72],"be":[73],"attributed":[74],"(1)":[76],"inflexibility":[77],"underlying":[79],"hardware":[80],"(2)":[82],"inherent":[83],"reduction":[84],"data-reuse":[86,102,155],"opportunities":[87,156],"structures.":[91],"To":[92],"address":[93],"issues,":[95],"we":[96],"propose":[97],"a":[98],"dynamically":[99],"reshaping,":[100],"high":[101],"PE":[103,141],"array":[104,142],"accelerator,":[105],"namely":[106],"DyNNamic":[107],".":[108],"DyNNamic":[109,138,184],"leverages":[110],"kernel-wise":[111],"filter":[112],"decomposition":[113],"partition":[115],"convolution":[117],"operation":[118],"into":[119],"two":[120],"stages:":[122],"Shared":[123],"Kernels":[124],"Convolution":[125],"(SKC)":[126],"Weighted":[128],"Accumulation":[129],"(WA).":[130],"Because":[131],"stages":[133],"have":[134],"vastly":[135],"different":[136],"dimensions,":[137],"reshapes":[139],"its":[140],"effectively":[144],"map":[145],"algorithm":[147],"architecture.":[150],"The":[151],"architecture":[152],"then":[153],"exploits":[154],"created":[157],"by":[158,187],"SKC":[160],"stage,":[161],"further":[162],"with":[166],"negligible":[167],"overhead.":[168],"We":[169],"evaluate":[170],"our":[171],"approach":[172],"on":[173],"various":[174],"representative":[175],"networks":[176],"compare":[178],"against":[179],"accelerators.":[181],"On":[182],"average,":[183],"outperforms":[185],"DianNao":[186],"$8.4\\times$":[189],"notation=\"LaTeX\">$12.3\\times$":[192],"in":[193],"terms":[194],"inference":[196],"latency,":[199],"respectively.":[200]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4285225262","counts_by_year":[],"updated_date":"2024-03-19T14:51:18.423103","created_date":"2022-07-14"}