{"id":"https://openalex.org/W4391272049","doi":"https://doi.org/10.48550/arxiv.2401.13714","title":"Value-Driven Mixed-Precision Quantization for Patch-Based Inference on Microcontrollers","display_name":"Value-Driven Mixed-Precision Quantization for Patch-Based Inference on Microcontrollers","publication_year":2024,"publication_date":"2024-01-24","ids":{"openalex":"https://openalex.org/W4391272049","doi":"https://doi.org/10.48550/arxiv.2401.13714"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2401.13714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.13714","pdf_url":"https://arxiv.org/pdf/2401.13714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2401.13714","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046355512","display_name":"Wei Tao","orcid":"https://orcid.org/0000-0002-8273-6649"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tao, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101353824","display_name":"Shenglin He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Shenglin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100625354","display_name":"Kai L\u00fc","orcid":"https://orcid.org/0000-0002-6378-7002"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Kai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100940847","display_name":"Xiaoyang Qu","orcid":"https://orcid.org/0009-0009-6311-4332"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qu, Xiaoyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009868061","display_name":"Guokuan Li","orcid":"https://orcid.org/0009-0005-7998-5520"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Guokuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044866795","display_name":"Jiguang Wan","orcid":"https://orcid.org/0000-0003-3440-4460"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wan, Jiguang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074472751","display_name":"Jianzong Wang","orcid":"https://orcid.org/0000-0002-9237-4231"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jianzong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5016038454","display_name":"Jing Xiao","orcid":"https://orcid.org/0000-0001-9615-4749"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Jing","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5046355512"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9764999747276306,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9764999747276306,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9753999710083008,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9732999801635742,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7442363500595093},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.7093479633331299},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.695609450340271},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6067180633544922},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.5924874544143677},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.5590577721595764},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.4882538616657257},{"id":"https://openalex.org/keywords/microcontroller","display_name":"Microcontroller","score":0.45848697423934937},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.42732787132263184},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3215469717979431},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3210110664367676},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.24202293157577515},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.09164151549339294}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7442363500595093},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.7093479633331299},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.695609450340271},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6067180633544922},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.5924874544143677},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.5590577721595764},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.4882538616657257},{"id":"https://openalex.org/C173018170","wikidata":"https://www.wikidata.org/wiki/Q165678","display_name":"Microcontroller","level":2,"score":0.45848697423934937},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.42732787132263184},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3215469717979431},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3210110664367676},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.24202293157577515},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.09164151549339294}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2401.13714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.13714","pdf_url":"https://arxiv.org/pdf/2401.13714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2401.13714","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2401.13714","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2401.13714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.13714","pdf_url":"https://arxiv.org/pdf/2401.13714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321883","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53"},{"id":"https://openalex.org/F4320336405","display_name":"Special Project for Research and Development in Key areas of Guangdong Province","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391272049.pdf","grobid_xml":"https://content.openalex.org/works/W4391272049.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2293118914","https://openalex.org/W2998381397","https://openalex.org/W4236419692","https://openalex.org/W2058965144","https://openalex.org/W2164382479","https://openalex.org/W3167919718","https://openalex.org/W4251718783","https://openalex.org/W2171015181","https://openalex.org/W4239447582","https://openalex.org/W2187181201"],"abstract_inverted_index":{"Deploying":[0],"neural":[1],"networks":[2],"on":[3,113,132,151,214,226],"microcontroller":[4],"units":[5],"(MCUs)":[6],"presents":[7],"substantial":[8,46],"challenges":[9,65],"due":[10],"to":[11,27,44,54,90,101,128,160,188,198,206,234],"their":[12,156],"constrained":[13],"computation":[14,41,177,223],"and":[15,69,178,180],"memory":[16,29],"resources.":[17],"Previous":[18],"researches":[19],"have":[20],"explored":[21],"patch-based":[22,82,237],"inference":[23,83,238],"as":[24,184],"a":[25,45,70,80,167],"strategy":[26],"conserve":[28],"without":[30,142],"sacrificing":[31],"model":[32,104,231],"accuracy.":[33,105],"However,":[34],"this":[35,56,75],"technique":[36],"suffers":[37],"from":[38],"severe":[39],"redundant":[40,92],"overhead,":[42],"leading":[43],"increase":[47],"in":[48],"execution":[49],"latency.":[50],"A":[51],"feasible":[52],"solution":[53],"address":[55],"issue":[57],"is":[58],"mixed-precision":[59,88],"quantization,":[60],"but":[61],"it":[62,181],"faces":[63],"the":[64,103,129,133,152,200,209,235],"of":[66,155,202],"accuracy":[67,186,232],"degradation":[68],"time-consuming":[71],"search":[72,149,162,170,210],"time.":[73,163],"In":[74,138],"paper,":[76],"we":[77,124,145],"propose":[78],"QuantMCU,":[79],"novel":[81,168],"method":[84],"that":[85,136,172,219],"utilizes":[86],"value-driven":[87,97,147],"quantization":[89,127,148,169],"reduce":[91,161,222],"computation.":[93],"We":[94],"first":[95],"utilize":[96,146],"patch":[98],"classification":[99],"(VDPC)":[100],"maintain":[102],"VDPC":[106],"classifies":[107],"patches":[108,120,141],"into":[109,174],"two":[110],"classes":[111],"based":[112],"whether":[114],"they":[115],"contain":[116],"outlier":[117,122,143],"values.":[118],"For":[119],"containing":[121],"values,":[123,144],"apply":[125],"8-bit":[126],"feature":[130,153,204],"maps":[131,154],"dataflow":[134,158],"branches":[135,159],"follow.":[137],"addition,":[139],"for":[140],"(VDQS)":[150],"following":[157],"Specifically,":[164],"VDQS":[165,192],"introduces":[166],"metric":[171],"takes":[173],"account":[175],"both":[176],"accuracy,":[179],"employs":[182],"entropy":[183],"an":[185,195],"representation":[187],"avoid":[189],"additional":[190],"training.":[191],"also":[193],"adopts":[194],"iterative":[196],"approach":[197],"determine":[199],"bitwidth":[201],"each":[203],"map":[205],"further":[207],"accelerate":[208],"process.":[211],"Experimental":[212],"results":[213],"real-world":[215],"MCU":[216],"devices":[217],"show":[218],"QuantMCU":[220],"can":[221],"by":[224],"2.2x":[225],"average":[227],"while":[228],"maintaining":[229],"comparable":[230],"compared":[233],"state-of-the-art":[236],"methods.":[239]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
