{"id":"https://openalex.org/W4388543812","doi":"https://doi.org/10.1109/jiot.2023.3331654","title":"Enabling ImageNet-Scale Deep Learning on MCUs for Accurate and Efficient Inference","display_name":"Enabling ImageNet-Scale Deep Learning on MCUs for Accurate and Efficient Inference","publication_year":2023,"publication_date":"2023-11-09","ids":{"openalex":"https://openalex.org/W4388543812","doi":"https://doi.org/10.1109/jiot.2023.3331654"},"language":"en","primary_location":{"id":"doi:10.1109/jiot.2023.3331654","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2023.3331654","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024765022","display_name":"Sulaiman Sadiq","orcid":"https://orcid.org/0000-0003-4959-4623"},"institutions":[{"id":"https://openalex.org/I43439940","display_name":"University of Southampton","ror":"https://ror.org/01ryk1543","country_code":"GB","type":"education","lineage":["https://openalex.org/I43439940"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sulaiman Sadiq","raw_affiliation_strings":["Department of Electronics and Computer Science, University of Southampton, Southampton, U.K"],"raw_orcid":"https://orcid.org/0000-0003-4959-4623","affiliations":[{"raw_affiliation_string":"Department of Electronics and Computer Science, University of Southampton, Southampton, U.K","institution_ids":["https://openalex.org/I43439940"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067505586","display_name":"Jonathon Hare","orcid":"https://orcid.org/0000-0003-2921-4283"},"institutions":[{"id":"https://openalex.org/I43439940","display_name":"University of Southampton","ror":"https://ror.org/01ryk1543","country_code":"GB","type":"education","lineage":["https://openalex.org/I43439940"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jonathon Hare","raw_affiliation_strings":["Department of Electronics and Computer Science, University of Southampton, Southampton, U.K"],"raw_orcid":"https://orcid.org/0000-0003-2921-4283","affiliations":[{"raw_affiliation_string":"Department of Electronics and Computer Science, University of Southampton, Southampton, U.K","institution_ids":["https://openalex.org/I43439940"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008802851","display_name":"Simon Craske","orcid":null},"institutions":[{"id":"https://openalex.org/I2801109035","display_name":"ARM (United Kingdom)","ror":"https://ror.org/04mmhzs81","country_code":"GB","type":"company","lineage":["https://openalex.org/I2801109035"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Simon Craske","raw_affiliation_strings":["Central Technology Group, ARM Ltd., Cambridge, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Central Technology Group, ARM Ltd., Cambridge, U.K","institution_ids":["https://openalex.org/I2801109035"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016261879","display_name":"Partha Maji","orcid":"https://orcid.org/0000-0002-1919-1228"},"institutions":[{"id":"https://openalex.org/I4210121368","display_name":"Machine Science","ror":"https://ror.org/02hrr9v50","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210121368"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Partha Maji","raw_affiliation_strings":["Machine Learning Department, Tenstorrent, Cambridge, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Machine Learning Department, Tenstorrent, Cambridge, U.K","institution_ids":["https://openalex.org/I4210121368"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001556143","display_name":"Geoff V. Merrett","orcid":"https://orcid.org/0000-0003-4980-3894"},"institutions":[{"id":"https://openalex.org/I43439940","display_name":"University of Southampton","ror":"https://ror.org/01ryk1543","country_code":"GB","type":"education","lineage":["https://openalex.org/I43439940"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Geoff Merrett","raw_affiliation_strings":["Department of Electronics and Computer Science, University of Southampton, Southampton, U.K"],"raw_orcid":"https://orcid.org/0000-0003-4980-3894","affiliations":[{"raw_affiliation_string":"Department of Electronics and Computer Science, University of Southampton, Southampton, U.K","institution_ids":["https://openalex.org/I43439940"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.7859,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.74698042,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"11","issue":"7","first_page":"11471","last_page":"11479"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7920858263969421},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7865021228790283},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.6921301484107971},{"id":"https://openalex.org/keywords/microcontroller","display_name":"Microcontroller","score":0.6270347833633423},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5762313604354858},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4582492709159851},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.438434362411499},{"id":"https://openalex.org/keywords/auxiliary-memory","display_name":"Auxiliary memory","score":0.43295592069625854},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.37380552291870117},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3246697783470154},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.2056603729724884}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7920858263969421},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7865021228790283},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.6921301484107971},{"id":"https://openalex.org/C173018170","wikidata":"https://www.wikidata.org/wiki/Q165678","display_name":"Microcontroller","level":2,"score":0.6270347833633423},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5762313604354858},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4582492709159851},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.438434362411499},{"id":"https://openalex.org/C82687282","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Auxiliary memory","level":2,"score":0.43295592069625854},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.37380552291870117},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3246697783470154},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2056603729724884},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/jiot.2023.3331654","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2023.3331654","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},{"id":"pmh:oai:eprints.soton.ac.uk:483972","is_oa":false,"landing_page_url":"http://doi.org/10.1109/JIOT.2023.3331654>).","pdf_url":null,"source":{"id":"https://openalex.org/S4306401019","display_name":"ePrints Soton (University of Southampton)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I43439940","host_organization_name":"University of Southampton","host_organization_lineage":["https://openalex.org/I43439940"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3496335909","display_name":"Centre for Spatial Computational Learning","funder_award_id":"EP/S030069/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G4587427570","display_name":null,"funder_award_id":"EP/S030069/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6750118813","display_name":null,"funder_award_id":"EP/S024298/1","funder_id":"https://openalex.org/F4320314731","funder_display_name":"UK Research and Innovation"}],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"},{"id":"https://openalex.org/F4320316514","display_name":"Arm","ror":"https://ror.org/04mmhzs81"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W2058401212","https://openalex.org/W2160815625","https://openalex.org/W2194775991","https://openalex.org/W2524428287","https://openalex.org/W2784372305","https://openalex.org/W2786027963","https://openalex.org/W2909545524","https://openalex.org/W2924533679","https://openalex.org/W2963163009","https://openalex.org/W2963918968","https://openalex.org/W2967733054","https://openalex.org/W2982083293","https://openalex.org/W2998696623","https://openalex.org/W3007729836","https://openalex.org/W3013186616","https://openalex.org/W3049586678","https://openalex.org/W3137875211","https://openalex.org/W3160945783","https://openalex.org/W4284899413","https://openalex.org/W4284974526","https://openalex.org/W4292794010","https://openalex.org/W4297775537","https://openalex.org/W4385245566","https://openalex.org/W6639703010","https://openalex.org/W6677103964","https://openalex.org/W6677580257","https://openalex.org/W6727208969","https://openalex.org/W6730047919","https://openalex.org/W6737664043","https://openalex.org/W6747876305","https://openalex.org/W6756887525","https://openalex.org/W6762610423","https://openalex.org/W6762718338","https://openalex.org/W6762754082","https://openalex.org/W6765643347","https://openalex.org/W6775717222","https://openalex.org/W6780827055","https://openalex.org/W6784225549","https://openalex.org/W6784581357","https://openalex.org/W6788927946","https://openalex.org/W6797184042","https://openalex.org/W6803926790","https://openalex.org/W6839700459","https://openalex.org/W6922480057"],"related_works":["https://openalex.org/W4316095964","https://openalex.org/W2770234245","https://openalex.org/W96612179","https://openalex.org/W4229499248","https://openalex.org/W2566006169","https://openalex.org/W1567818861","https://openalex.org/W2987774938","https://openalex.org/W4256492088","https://openalex.org/W2383001583","https://openalex.org/W632915154"],"abstract_inverted_index":{"Conventional":[0],"approaches":[1],"to":[2,49,105,139,172,187],"Tiny":[3],"Machine":[4],"Learning":[5],"(TinyML)":[6],"achieve":[7],"high":[8,63],"accuracy":[9,60,175],"by":[10,29],"deploying":[11],"the":[12,18,25,30,72,84,114,126,141,153],"largest":[13],"deep":[14],"learning":[15],"model":[16],"with":[17,77,170],"highest":[19],"input":[20],"resolutions":[21],"that":[22,51,70],"fit":[23],"within":[24,54],"size":[26],"constraints":[27,56,85],"imposed":[28],"microcontroller\u2019s":[31],"(MCUs)":[32],"fast":[33],"internal":[34,87,107,189],"storage":[35,108],"and":[36,98,109,134,176],"memory.":[37,88],"In":[38],"this":[39],"article,":[40],"we":[41,123,148],"perform":[42],"an":[43,67],"in-depth":[44],"analysis":[45],"of":[46,74,86,94,117,160],"prior":[47],"works":[48],"show":[50],"models":[52,76,151],"derived":[53],"these":[55],"suffer":[57],"from":[58,83,145,152],"low":[59,78],"and,":[61],"surprisingly,":[62],"latency.":[64,142],"We":[65,89],"propose":[66],"alternative":[68],"approach":[69],"enables":[71],"deployment":[73],"efficient":[75,150],"inference":[79,121,128],"latency,":[80,122],"but":[81,101],"free":[82],"take":[90],"a":[91,158],"holistic":[92],"view":[93],"typical":[95],"MCU":[96],"architectures":[97],"utilize":[99],"plentiful":[100],"slower":[102],"external":[103,118],"memories":[104],"relax":[106],"memory":[110,119,190],"constraints.":[111],"To":[112],"avoid":[113],"lower":[115],"speed":[116],"impacting":[120],"build":[124],"on":[125,166],"TinyOps":[127,154],"framework,":[129],"which":[130],"performs":[131],"operation":[132],"partitioning":[133],"uses":[135],"overlays":[136],"via":[137],"DMA,":[138],"accelerate":[140],"Using":[143],"insights":[144],"our":[146],"study,":[147],"deploy":[149],"design":[155],"space":[156],"onto":[157],"range":[159],"embedded":[161],"MCUs":[162],"achieving":[163],"record":[164],"performance":[165],"TinyML":[167],"ImageNet":[168],"classification":[169],"up":[171],"6.7%":[173],"higher":[174],"<inline-formula":[177],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[178],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[179],"<tex-math":[180],"notation=\"LaTeX\">$1.4\\times":[181],"$":[182],"</tex-math></inline-formula>":[183],"faster":[184],"latency":[185],"compared":[186],"state-of-the-art":[188],"approaches.":[191]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
