{"id":"https://openalex.org/W4416472425","doi":"https://doi.org/10.1145/3680207.3765247","title":"AdaptQNet: Optimizing Quantized DNN on Microcontrollers via Adaptive Heterogeneous Processing Unit Utilization","display_name":"AdaptQNet: Optimizing Quantized DNN on Microcontrollers via Adaptive Heterogeneous Processing Unit Utilization","publication_year":2025,"publication_date":"2025-11-03","ids":{"openalex":"https://openalex.org/W4416472425","doi":"https://doi.org/10.1145/3680207.3765247"},"language":null,"primary_location":{"id":"doi:10.1145/3680207.3765247","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3680207.3765247","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st Annual International Conference on Mobile Computing and Networking","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111967675","display_name":"Yafei Sun","orcid":"https://orcid.org/0009-0005-5477-1059"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yansong Sun","raw_affiliation_strings":["Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101955964","display_name":"Jialuo He","orcid":"https://orcid.org/0009-0004-6461-3866"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jialuo He","raw_affiliation_strings":["Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043302724","display_name":"Dirk Kutscher","orcid":"https://orcid.org/0000-0002-9021-9916"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dirk Kutscher","raw_affiliation_strings":["Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014199941","display_name":"Huangxun Chen","orcid":"https://orcid.org/0000-0002-0313-4421"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huangxun Chen","raw_affiliation_strings":["Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5111967675"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.35763399,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"802","last_page":"816"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.16740000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.16740000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.14489999413490295,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.11400000005960464,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/microcontroller","display_name":"Microcontroller","score":0.673799991607666},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6209999918937683},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5358999967575073},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5097000002861023},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4812000095844269},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4756999909877777},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4189999997615814},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.39320001006126404}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7874000072479248},{"id":"https://openalex.org/C173018170","wikidata":"https://www.wikidata.org/wiki/Q165678","display_name":"Microcontroller","level":2,"score":0.673799991607666},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6209999918937683},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5358999967575073},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5097000002861023},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4812000095844269},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4756999909877777},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4189999997615814},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4050000011920929},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3986999988555908},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.39500001072883606},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.39320001006126404},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.38260000944137573},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.29100000858306885},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.28600001335144043},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.2856999933719635},{"id":"https://openalex.org/C46743427","wikidata":"https://www.wikidata.org/wiki/Q1341685","display_name":"Inference engine","level":3,"score":0.2815999984741211},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2773999869823456},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2667999863624573},{"id":"https://openalex.org/C3017813396","wikidata":"https://www.wikidata.org/wiki/Q17078173","display_name":"Resource constraints","level":2,"score":0.26669999957084656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26489999890327454},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.263700008392334},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.25859999656677246},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3680207.3765247","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3680207.3765247","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st Annual International Conference on Mobile Computing and Networking","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2931092525","https://openalex.org/W2963122961","https://openalex.org/W2963163009","https://openalex.org/W2982083293","https://openalex.org/W2982479999","https://openalex.org/W3013186616","https://openalex.org/W3165698711","https://openalex.org/W4283020086","https://openalex.org/W4380926962","https://openalex.org/W4380928297","https://openalex.org/W4386607611","https://openalex.org/W4403636552","https://openalex.org/W4404132984","https://openalex.org/W4404133524","https://openalex.org/W4405013858"],"related_works":[],"abstract_inverted_index":{"There":[0],"is":[1],"a":[2,62,86,103],"growing":[3],"trend":[4],"in":[5,16,34,73,113],"deploying":[6],"DNNs":[7],"on":[8,61,119,160],"tiny":[9],"microcontroller":[10],"(MCUs)":[11],"to":[12,27,135,140],"provide":[13],"inference":[14,36],"capabilities":[15,71,134],"the":[17,95,108,125,152],"IoT.":[18],"While":[19],"prior":[20],"research":[21],"has":[22],"explored":[23],"many":[24,74],"lightweight":[25],"techniques":[26],"compress":[28],"DNN":[29,104,114],"models,":[30],"achieving":[31],"overall":[32],"efficiency":[33],"model":[35,40],"requires":[37],"not":[38],"only":[39],"optimization":[41],"but":[42],"also":[43],"careful":[44],"system":[45,91],"resource":[46],"utilization":[47],"for":[48,58,99],"execution.":[49],"Existing":[50],"studies":[51],"primarily":[52],"leverage":[53],"arithmetic":[54],"logic":[55],"units":[56,67],"(ALUs)":[57],"integer-only":[59],"computations":[60],"single":[63],"CPU":[64],"core.":[65],"Floating-point":[66],"(FPU)":[68],"and":[69,132,146],"multi-core":[70,133],"available":[72],"existing":[75],"MCUs":[76],"remain":[77],"underutilized.":[78],"To":[79],"fill":[80],"this":[81],"gap,":[82],"we":[83],"propose":[84],"AdaptQNet,":[85],"novel":[87],"MCU":[88],"neural":[89],"network":[90],"that":[92,129,149],"can":[93],"determine":[94],"optimal":[96],"precision":[97],"assignment":[98],"different":[100,117],"layers":[101],"of":[102,110,127,154],"model.":[105],"AdaptQNet":[106,150],"models":[107,115,128,155],"latency":[109],"various":[111],"operators":[112],"across":[116],"precisions":[118],"heterogeneous":[120],"processing":[121],"units.":[122],"This":[123],"facilitates":[124],"discovery":[126],"utilize":[130],"FPU":[131],"enhance":[136],"capacity":[137],"while":[138],"adhering":[139],"stringent":[141],"memory":[142],"constraints.":[143],"Our":[144],"implementation":[145],"experiments":[147],"demonstrate":[148],"enables":[151],"deployment":[153],"with":[156],"better":[157],"accuracy-efficiency":[158],"trade-off":[159],"MCUs.":[161]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-11-23T00:00:00"}
