{"id":"https://openalex.org/W2908466063","doi":"https://doi.org/10.1109/newcas.2018.8585656","title":"Identifying and Exploiting Ineffectual Computations to Enable Hardware Acceleration of Deep Learning","display_name":"Identifying and Exploiting Ineffectual Computations to Enable Hardware Acceleration of Deep Learning","publication_year":2018,"publication_date":"2018-06-01","ids":{"openalex":"https://openalex.org/W2908466063","doi":"https://doi.org/10.1109/newcas.2018.8585656","mag":"2908466063"},"language":"en","primary_location":{"id":"doi:10.1109/newcas.2018.8585656","is_oa":false,"landing_page_url":"https://doi.org/10.1109/newcas.2018.8585656","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 16th IEEE International New Circuits and Systems Conference (NEWCAS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072544251","display_name":"Andreas Moshovos","orcid":"https://orcid.org/0000-0001-7768-367X"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Andreas Moshovos","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005950098","display_name":"Jorge Albericio","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jorge Albericio","raw_affiliation_strings":["NVIDIA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NVIDIA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090235913","display_name":"Patrick Judd","orcid":"https://orcid.org/0000-0001-8177-200X"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Patrick Judd","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084461132","display_name":"Alberto Delm\u00e1s","orcid":null},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Alberto Delmas","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061847219","display_name":"Sayeh Sharify","orcid":null},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Sayeh Sharify","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103806733","display_name":"Mostafa Mahmoud","orcid":"https://orcid.org/0000-0002-9100-7966"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Mostafa Mahmoud","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034060699","display_name":"Tayler Hetherington","orcid":null},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Tayler Hetherington","raw_affiliation_strings":["University of British Columbia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of British Columbia","institution_ids":["https://openalex.org/I141945490"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101550828","display_name":"Milo\u0161 Nikoli\u0107","orcid":"https://orcid.org/0000-0002-4168-0837"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Milos Nikolic","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069857678","display_name":"Dylan Malone Stuart","orcid":null},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Dylan Malone Stuart","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014486668","display_name":"Kevin Siu","orcid":null},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Kevin Siu","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018312650","display_name":"Zissis Poulos","orcid":"https://orcid.org/0000-0002-2427-7413"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Zissis Poulos","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026788167","display_name":"Tor M. Aamodt","orcid":"https://orcid.org/0000-0003-1161-692X"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Tor Aamodt","raw_affiliation_strings":["University of British Columbia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of British Columbia","institution_ids":["https://openalex.org/I141945490"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060103552","display_name":"Natalie Enright Jerger","orcid":"https://orcid.org/0000-0002-0526-2080"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Natalie Enright Jerger","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":13,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.106,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.49214725,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"abs 1706 504","issue":null,"first_page":"356","last_page":"360"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8281701803207397},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.7443954944610596},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6350516080856323},{"id":"https://openalex.org/keywords/reuse","display_name":"Reuse","score":0.5743978023529053},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5412648916244507},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5325704216957092},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.4571187496185303},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.446880578994751},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4465288817882538},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.4317065477371216},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.4247589111328125},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3871249556541443},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.36812636256217957},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3623817563056946},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.28447192907333374},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2225225567817688},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10899540781974792},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.10104489326477051}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8281701803207397},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.7443954944610596},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6350516080856323},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.5743978023529053},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5412648916244507},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5325704216957092},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.4571187496185303},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.446880578994751},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4465288817882538},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.4317065477371216},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.4247589111328125},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3871249556541443},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.36812636256217957},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3623817563056946},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.28447192907333374},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2225225567817688},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10899540781974792},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.10104489326477051},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/newcas.2018.8585656","is_oa":false,"landing_page_url":"https://doi.org/10.1109/newcas.2018.8585656","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 16th IEEE International New Circuits and Systems Conference (NEWCAS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8999999761581421,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1902934009","https://openalex.org/W1970027940","https://openalex.org/W2048266589","https://openalex.org/W2098335003","https://openalex.org/W2246760854","https://openalex.org/W2279098554","https://openalex.org/W2285660444","https://openalex.org/W2516141709","https://openalex.org/W2529546376","https://openalex.org/W2541839172","https://openalex.org/W2554302513","https://openalex.org/W2617247391","https://openalex.org/W2625457103","https://openalex.org/W2742044963","https://openalex.org/W2797864974","https://openalex.org/W2919115771","https://openalex.org/W2952857977","https://openalex.org/W4240168186","https://openalex.org/W4247198796","https://openalex.org/W4301131225","https://openalex.org/W6639703010","https://openalex.org/W6651700774","https://openalex.org/W6695314431","https://openalex.org/W6738105350","https://openalex.org/W6738885641","https://openalex.org/W6742680294","https://openalex.org/W6750320991","https://openalex.org/W6764418811"],"related_works":["https://openalex.org/W17155033","https://openalex.org/W3207760230","https://openalex.org/W1496222301","https://openalex.org/W1590307681","https://openalex.org/W4319952061","https://openalex.org/W4280636456","https://openalex.org/W4388913998","https://openalex.org/W4310584535","https://openalex.org/W4295935044","https://openalex.org/W3159906349"],"abstract_inverted_index":{"This":[0],"article":[1],"summarizes":[2],"somde":[3],"of":[4,53,123,136,140,154,167],"our":[5],"work":[6],"on":[7,87],"hardware":[8,21,61,155],"accelerators":[9],"for":[10,23],"inference":[11],"with":[12],"Deep":[13],"Learning":[14],"Neural":[15],"Networks":[16],"(DNNs).":[17],"Early":[18],"success":[19],"in":[20,33,49,75,96,138,179],"acceleration":[22],"DNNs":[24,54],"exploited":[25],"the":[26,30,50,60,120,184],"computation":[27],"structure":[28],"and":[29,69,72,79,108,145,150,193],"significant":[31],"reuse":[32],"their":[34],"access":[35],"stream.":[36],"Our":[37],"approach":[38],"to":[39,45,63,94,127,160,199],"further":[40],"boost":[41],"benefits":[42],"has":[43],"been":[44,85],"first":[46],"identify":[47],"properties":[48,88,99,186],"value":[51],"stream":[52],"which":[55],"we":[56],"can":[57],"exploit":[58],"at":[59],"level":[62],"improve":[64],"execution":[65,80,147],"time,":[66],"reduce":[67],"off-":[68],"on-chip":[70],"communication":[71],"storage,":[73],"resulting":[74],"higher":[76],"energy":[77,143],"efficiency":[78],"time":[81,148],"reduction.":[82],"We":[83],"have":[84,114],"focusing":[86],"that":[89,102,109,113,125,171,182],"are":[90,103],"difficult":[91],"or":[92,105,118,191],"impossible":[93],"discern":[95],"advance.":[97],"These":[98],"include":[100],"values":[101,112,124],"zero":[104,107],"near":[106],"prove":[110],"ineffectual,":[111],"reduced":[115,189],"precision":[116,190],"needs,":[117],"even":[119],"bit-level":[121],"content":[122],"lead":[126],"ineffectual":[128],"computations.":[129],"The":[130],"presented":[131],"designs":[132,169],"cover":[133],"a":[134,152,196],"spectrum":[135],"choices":[137],"terms":[139],"area":[141],"cost,":[142],"efficiency,":[144],"relative":[146],"performance":[149],"target":[151],"variety":[153],"devices":[156],"from":[157],"embedded":[158],"systems":[159],"server":[161],"class":[162],"machines.":[163],"A":[164],"key":[165],"characteristic":[166],"these":[168],"is":[170],"they":[172],"reward":[173],"but":[174],"do":[175],"not":[176],"requires":[177],"advances":[178],"model":[180],"design":[181],"increase":[183],"aforementioned":[185],"(such":[187],"as":[188],"sparsity)":[192],"thus":[194],"provide":[195],"safe":[197],"path":[198],"innovation.":[200]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
