{"id":"https://openalex.org/W2793950911","doi":"https://doi.org/10.1109/tnnls.2018.2808319","title":"Ristretto: A Framework for Empirical Study of Resource-Efficient Inference in Convolutional Neural Networks","display_name":"Ristretto: A Framework for Empirical Study of Resource-Efficient Inference in Convolutional Neural Networks","publication_year":2018,"publication_date":"2018-03-16","ids":{"openalex":"https://openalex.org/W2793950911","doi":"https://doi.org/10.1109/tnnls.2018.2808319","mag":"2793950911","pmid":"https://pubmed.ncbi.nlm.nih.gov/29993820"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2018.2808319","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2018.2808319","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049002650","display_name":"Philipp Gysel","orcid":"https://orcid.org/0000-0003-1681-9662"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Philipp Gysel","raw_affiliation_strings":["Laboratory for Embedded and Programmable Systems, University of California at Davis, Davis, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-1681-9662","affiliations":[{"raw_affiliation_string":"Laboratory for Embedded and Programmable Systems, University of California at Davis, Davis, CA, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033433243","display_name":"Jon J. Pimentel","orcid":"https://orcid.org/0000-0002-0833-0392"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jon Pimentel","raw_affiliation_strings":["VLSI Computation Laboratory, University of California at Davis, Davis, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-0833-0392","affiliations":[{"raw_affiliation_string":"VLSI Computation Laboratory, University of California at Davis, Davis, CA, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101525467","display_name":"Mohammad Motamedi","orcid":"https://orcid.org/0000-0003-0120-8738"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohammad Motamedi","raw_affiliation_strings":["Laboratory for Embedded and Programmable Systems, University of California at Davis, Davis, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratory for Embedded and Programmable Systems, University of California at Davis, Davis, CA, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031842294","display_name":"Soheil Ghiasi","orcid":"https://orcid.org/0000-0002-1036-791X"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Soheil Ghiasi","raw_affiliation_strings":["Laboratory for Embedded and Programmable Systems, University of California at Davis, Davis, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-1036-791X","affiliations":[{"raw_affiliation_string":"Laboratory for Embedded and Programmable Systems, University of California at Davis, Davis, CA, USA","institution_ids":["https://openalex.org/I84218800"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5049002650"],"corresponding_institution_ids":["https://openalex.org/I84218800"],"apc_list":null,"apc_paid":null,"fwci":15.7219,"has_fulltext":false,"cited_by_count":245,"citation_normalized_percentile":{"value":0.99216085,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"29","issue":"11","first_page":"5784","last_page":"5789"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7812018394470215},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7535011768341064},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7062333822250366},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47265541553497314},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.46712595224380493},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.08405658602714539}],"concepts":[{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7812018394470215},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7535011768341064},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7062333822250366},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47265541553497314},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.46712595224380493},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.08405658602714539}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2018.2808319","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2018.2808319","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:29993820","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/29993820","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4890808801","display_name":null,"funder_award_id":"CCF-1346812","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1825672851","https://openalex.org/W1903029394","https://openalex.org/W2090557012","https://openalex.org/W2097117768","https://openalex.org/W2115611348","https://openalex.org/W2117539524","https://openalex.org/W2119144962","https://openalex.org/W2155893237","https://openalex.org/W2163605009","https://openalex.org/W2186094539","https://openalex.org/W2279098554","https://openalex.org/W2319920447","https://openalex.org/W2337344472","https://openalex.org/W2524428287","https://openalex.org/W2560017826","https://openalex.org/W2571689128","https://openalex.org/W2612864759","https://openalex.org/W2756009169","https://openalex.org/W2950894517","https://openalex.org/W2963424132","https://openalex.org/W2964299589","https://openalex.org/W4294371482","https://openalex.org/W6677580257","https://openalex.org/W6684191040","https://openalex.org/W6703414193","https://openalex.org/W6730047919"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Convolutional":[0],"neural":[1],"networks":[2,199],"(CNNs)":[3],"have":[4],"led":[5],"to":[6,36,40,72,124,128,167,194,203],"remarkable":[7],"progress":[8],"in":[9,84],"a":[10,33,68,90,119,164,174,183,218],"number":[11,103,176],"of":[12,65,98,113,135,147,189,234,237],"key":[13],"pattern":[14],"recognition":[15],"tasks,":[16],"such":[17],"as":[18,217,233],"visual":[19],"scene":[20],"understanding":[21],"and":[22,58,105,109,132,137,141,178,212,223],"speech":[23],"recognition,":[24],"that":[25,94,196],"potentially":[26],"enable":[27,62],"numerous":[28],"applications.":[29],"Consequently,":[30],"there":[31],"is":[32,71,215],"significant":[34,52],"need":[35],"deploy":[37],"trained":[38,66],"CNNs":[39],"resource-constrained":[41],"embedded":[42],"systems.":[43],"Inference":[44],"using":[45],"pretrained":[46],"modern":[47],"deep":[48],"CNNs,":[49,67],"however,":[50],"requires":[51],"system":[53],"resources,":[54],"including":[55],"computation,":[56],"energy,":[57],"memory":[59],"space.":[60],"To":[61],"efficient":[63],"implementation":[64],"viable":[69],"approach":[70],"approximate":[73],"the":[74,99,110,114,145,157,235],"network":[75,166,210],"with":[76,80,122],"an":[77],"implementation-friendly":[78],"model":[79,158],"only":[81],"negligible":[82],"degradation":[83,187],"classification":[85,111,171,185],"accuracy.":[86,159],"We":[87],"present":[88],"Ristretto,":[89],"CNN":[91,121],"approximation":[92],"framework":[93],"enables":[95],"empirical":[96],"investigation":[97],"tradeoff":[100],"between":[101],"various":[102],"representation":[104,177],"word":[106,149,179],"width":[107,150,180],"choices":[108],"accuracy":[112,172,186],"model.":[115],"Specifically,":[116],"Ristretto":[117,161,193,214],"analyzes":[118],"given":[120,175],"respect":[123],"numerical":[125],"range":[126],"required":[127],"represent":[129],"weights,":[130],"activations,":[131],"intermediate":[133],"results":[134],"convolutional":[136],"fully":[138],"connected":[139],"layers,":[140],"subsequently,":[142],"it":[143],"simulates":[144],"impact":[146],"reduced":[148],"or":[151],"lower":[152],"precision":[153],"arithmetic":[154],"operators":[155],"on":[156,231],"Moreover,":[160],"can":[162,200],"fine-tune":[163],"quantized":[165],"further":[168],"improve":[169],"its":[170],"under":[173],"configuration.":[181],"Given":[182],"maximum":[184],"tolerance":[188],"1%,":[190],"we":[191],"use":[192,204],"demonstrate":[195],"three":[197],"ImageNet":[198],"be":[201],"condensed":[202],"8-bit":[205],"dynamic":[206],"fixed":[207],"point":[208],"for":[209],"weights":[211],"activations.":[213],"available":[216],"popular":[219],"open-source":[220],"software":[221],"project":[222],"has":[224],"already":[225],"been":[226],"viewed":[227],"over":[228],"1,000":[229],"times":[230],"Github":[232],"submission":[236],"this":[238],"brief.":[239]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":21},{"year":2023,"cited_by_count":29},{"year":2022,"cited_by_count":35},{"year":2021,"cited_by_count":41},{"year":2020,"cited_by_count":54},{"year":2019,"cited_by_count":38},{"year":2018,"cited_by_count":15}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
