{"id":"https://openalex.org/W3180864037","doi":"https://doi.org/10.1145/3440016","title":"Compressing RNNs to Kilobyte Budget for IoT Devices Using Kronecker Products","display_name":"Compressing RNNs to Kilobyte Budget for IoT Devices Using Kronecker Products","publication_year":2021,"publication_date":"2021-07-14","ids":{"openalex":"https://openalex.org/W3180864037","doi":"https://doi.org/10.1145/3440016","mag":"3180864037"},"language":"en","primary_location":{"id":"doi:10.1145/3440016","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3440016","pdf_url":null,"source":{"id":"https://openalex.org/S96198239","display_name":"ACM Journal on Emerging Technologies in Computing Systems","issn_l":"1550-4832","issn":["1550-4832","1550-4840"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Journal on Emerging Technologies in Computing Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090396089","display_name":"Urmish Thakker","orcid":"https://orcid.org/0000-0002-0515-9155"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Urmish Thakker","raw_affiliation_strings":["Arm ML Research Lab, Austin, TX"],"affiliations":[{"raw_affiliation_string":"Arm ML Research Lab, Austin, TX","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056063665","display_name":"Igor Fedorov","orcid":"https://orcid.org/0000-0002-7235-4823"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Igor Fedorov","raw_affiliation_strings":["Arm ML Research Lab, Austin, TX"],"affiliations":[{"raw_affiliation_string":"Arm ML Research Lab, Austin, TX","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112610083","display_name":"Chu Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chu Zhou","raw_affiliation_strings":["Arm ML Research Lab, Austin, TX"],"affiliations":[{"raw_affiliation_string":"Arm ML Research Lab, Austin, TX","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078130628","display_name":"Dibakar Gope","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dibakar Gope","raw_affiliation_strings":["Arm ML Research Lab, Austin, TX"],"affiliations":[{"raw_affiliation_string":"Arm ML Research Lab, Austin, TX","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090422974","display_name":"Matthew Mattina","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Matthew Mattina","raw_affiliation_strings":["Arm ML Research Lab, Austin, TX"],"affiliations":[{"raw_affiliation_string":"Arm ML Research Lab, Austin, TX","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004292742","display_name":"Ganesh Dasika","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ganesh Dasika","raw_affiliation_strings":["AMD Research, Austin, TX"],"affiliations":[{"raw_affiliation_string":"AMD Research, Austin, TX","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013531730","display_name":"Jesse Beu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jesse Beu","raw_affiliation_strings":["Arm ML Research Lab, Boston, MA"],"affiliations":[{"raw_affiliation_string":"Arm ML Research Lab, Boston, MA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5090396089"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3817,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.799148,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"17","issue":"4","first_page":"1","last_page":"18"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.8307379484176636},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7866164445877075},{"id":"https://openalex.org/keywords/kronecker-product","display_name":"Kronecker product","score":0.4898483455181122},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.44130146503448486},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.36879101395606995},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3627300262451172},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3467084765434265},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.240202397108078},{"id":"https://openalex.org/keywords/kronecker-delta","display_name":"Kronecker delta","score":0.21159353852272034}],"concepts":[{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.8307379484176636},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7866164445877075},{"id":"https://openalex.org/C46030957","wikidata":"https://www.wikidata.org/wiki/Q1238125","display_name":"Kronecker product","level":3,"score":0.4898483455181122},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.44130146503448486},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.36879101395606995},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3627300262451172},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3467084765434265},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.240202397108078},{"id":"https://openalex.org/C39482219","wikidata":"https://www.wikidata.org/wiki/Q192826","display_name":"Kronecker delta","level":2,"score":0.21159353852272034},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3440016","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3440016","pdf_url":null,"source":{"id":"https://openalex.org/S96198239","display_name":"ACM Journal on Emerging Technologies in Computing Systems","issn_l":"1550-4832","issn":["1550-4832","1550-4840"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Journal on Emerging Technologies in Computing Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1576347883","https://openalex.org/W1591801644","https://openalex.org/W1919191429","https://openalex.org/W2064675550","https://openalex.org/W2100659887","https://openalex.org/W2112796928","https://openalex.org/W2126511896","https://openalex.org/W2131524184","https://openalex.org/W2131774270","https://openalex.org/W2197984537","https://openalex.org/W2198190323","https://openalex.org/W2257163152","https://openalex.org/W2260663238","https://openalex.org/W2402302915","https://openalex.org/W2593303827","https://openalex.org/W2605203995","https://openalex.org/W2617991662","https://openalex.org/W2620263509","https://openalex.org/W2890309926","https://openalex.org/W2915589364","https://openalex.org/W2927608232","https://openalex.org/W2949896761","https://openalex.org/W2950635152","https://openalex.org/W2952344559","https://openalex.org/W2952899695","https://openalex.org/W2962820060","https://openalex.org/W2963396654","https://openalex.org/W2963656894","https://openalex.org/W2982011653","https://openalex.org/W3001665736","https://openalex.org/W3002071578","https://openalex.org/W3034226764","https://openalex.org/W3034893304","https://openalex.org/W3096109293","https://openalex.org/W3097185144","https://openalex.org/W3101111100","https://openalex.org/W3105347474","https://openalex.org/W4320800818"],"related_works":["https://openalex.org/W2361878581","https://openalex.org/W2073634779","https://openalex.org/W4225394202","https://openalex.org/W4298287631","https://openalex.org/W2953061907","https://openalex.org/W3032952384","https://openalex.org/W3034302643","https://openalex.org/W1847088711","https://openalex.org/W3036642985","https://openalex.org/W326456911"],"abstract_inverted_index":{"Micro-controllers":[0],"(MCUs)":[1],"make":[2],"up":[3],"most":[4],"of":[5,21,39,75,223],"the":[6,9,109,128,137,163,177,181,207],"processors":[7],"in":[8],"world":[10],"with":[11,29,122,145],"widespread":[12],"applicability":[13],"from":[14],"automobile":[15],"to":[16,24,33,65,102,120,131,140,196,212],"medical":[17],"devices.":[18],"The":[19],"Internet":[20,38],"Things":[22,40],"promises":[23],"enable":[25],"these":[26,68],"resource-constrained":[27,106],"MCUs":[28],"machine":[30],"learning":[31],"algorithms":[32],"provide":[34],"always-on":[35],"intelligence.":[36],"Many":[37],"applications":[41,156],"consume":[42],"time-series":[43],"data":[44],"that":[45,87,159],"are":[46],"naturally":[47],"suitable":[48],"for":[49,84,105],"recurrent":[50],"neural":[51],"networks":[52],"(RNNs)":[53],"like":[54],"LSTMs":[55],"and":[56,63,157],"GRUs.":[57],"However,":[58],"RNNs":[59,91,104],"can":[60,88,114,161,185],"be":[61],"large":[62,172],"difficult":[64],"deploy":[66],"on":[67],"devices,":[69],"as":[70],"they":[71],"have":[72],"few":[73],"kilobytes":[74],"memory.":[76],"As":[77],"a":[78,82,100,171,192,220],"result,":[79],"there":[80],"is":[81],"need":[83],"compression":[85,138,148,183,208,217],"techniques":[86,149,169],"significantly":[89],"compress":[90,103,115],"without":[92],"negatively":[93],"impacting":[94],"task":[95,164],"accuracy.":[96],"This":[97],"article":[98],"introduces":[99],"method":[101],"environments":[107],"using":[108],"Kronecker":[110],"product":[111],"(KP).":[112],"KPs":[113],"RNN":[116],"layers":[117],"by":[118,167,170,218],"16\u00d7":[119],"38\u00d7":[121],"minimal":[123],"accuracy":[124,165,188,214],"loss.":[125,189],"By":[126],"quantizing":[127],"resulting":[129],"models":[130],"8":[132],"bits,":[133],"we":[134],"further":[135],"push":[136],"factor":[139],"50\u00d7.":[141],"We":[142,190],"compare":[143],"KP":[144,160,182,194,201],"other":[146,168],"state-of-the-art":[147],"across":[150],"seven":[151],"benchmarks":[152],"spanning":[153],"five":[154],"different":[155],"show":[158],"beat":[162],"achieved":[166],"margin":[173],"while":[174],"simultaneously":[175],"improving":[176],"inference":[178],"runtime.":[179],"Sometimes":[180],"mechanism":[184],"introduce":[186],"an":[187],"develop":[191],"hybrid":[193,200],"approach":[195],"mitigate":[197],"this.":[198],"Our":[199],"algorithm":[202],"provides":[203],"fine-grained":[204],"control":[205],"over":[206],"ratio,":[209],"enabling":[210],"us":[211],"regain":[213],"lost":[215],"during":[216],"adding":[219],"small":[221],"number":[222],"model":[224],"parameters.":[225]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
