{"id":"https://openalex.org/W7160962456","doi":"https://doi.org/10.48550/arxiv.2605.09357","title":"Split CNN Inference on Networked Microcontrollers","display_name":"Split CNN Inference on Networked Microcontrollers","publication_year":2026,"publication_date":"2026-05-10","ids":{"openalex":"https://openalex.org/W7160962456","doi":"https://doi.org/10.48550/arxiv.2605.09357"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.09357","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.09357","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.09357","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020556154","display_name":"Junyu Lu","orcid":"https://orcid.org/0000-0003-2632-8736"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Junyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135955685","display_name":"Shashwath Suresh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Suresh, Shashwath","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135944371","display_name":"Hao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135934786","display_name":"Qi Hong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135935845","display_name":"Qing Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Qing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8046000003814697,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8046000003814697,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.024800000712275505,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.021199999377131462,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7573999762535095},{"id":"https://openalex.org/keywords/microcontroller","display_name":"Microcontroller","score":0.7267000079154968},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6593999862670898},{"id":"https://openalex.org/keywords/testbed","display_name":"Testbed","score":0.5871999859809875},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5288000106811523},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.520799994468689},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.4481000006198883},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.398499995470047}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7975999712944031},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7573999762535095},{"id":"https://openalex.org/C173018170","wikidata":"https://www.wikidata.org/wiki/Q165678","display_name":"Microcontroller","level":2,"score":0.7267000079154968},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6593999862670898},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.5871999859809875},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5288000106811523},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.520799994468689},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.4481000006198883},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.398499995470047},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38440001010894775},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.36340001225471497},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.35580000281333923},{"id":"https://openalex.org/C46743427","wikidata":"https://www.wikidata.org/wiki/Q1341685","display_name":"Inference engine","level":3,"score":0.34549999237060547},{"id":"https://openalex.org/C28362024","wikidata":"https://www.wikidata.org/wiki/Q2067413","display_name":"Thrashing","level":2,"score":0.3224000036716461},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.320499986410141},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.31369999051094055},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.3046000003814697},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.28380000591278076},{"id":"https://openalex.org/C2777062904","wikidata":"https://www.wikidata.org/wiki/Q545406","display_name":"Toolchain","level":3,"score":0.2696000039577484},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25529998540878296},{"id":"https://openalex.org/C101722063","wikidata":"https://www.wikidata.org/wiki/Q218825","display_name":"Random access","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.09357","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.09357","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.09357","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.09357","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Running":[0],"deep":[1],"neural":[2],"networks":[3],"on":[4,50,138,145,164],"microcontroller":[5],"units":[6],"(MCUs)":[7],"is":[8,82],"severely":[9],"constrained":[10],"by":[11,40],"limited":[12],"memory":[13,86],"resources.":[14,132],"While":[15],"TinyML":[16],"techniques":[17],"reduce":[18],"model":[19,112],"size":[20],"and":[21,106,109,114,142],"computation,":[22],"they":[23],"often":[24],"fail":[25],"in":[26],"practice":[27],"due":[28],"to":[29,103,147],"excessive":[30],"peak":[31,177],"Random":[32],"Access":[33],"Memory":[34],"(RAM)":[35],"usage":[36,179],"during":[37],"inference,":[38],"dominated":[39],"intermediate":[41,115],"activations.":[42],"As":[43],"a":[44,58,139,152,165],"result,":[45],"many":[46],"models":[47,75,102,162],"remain":[48],"infeasible":[49,163],"standalone":[51],"MCUs.":[52,119],"In":[53],"this":[54,192],"work,":[55],"we":[56],"present":[57],"fine-grained":[59],"split":[60],"inference":[61,69,90,126,185],"system":[62,137],"for":[63],"networked":[64,172],"MCUs":[65,149],"that":[66,83,160],"enables":[67],"collaborative":[68],"of":[70,191],"Convolutional":[71],"Neural":[72],"Networks":[73],"(CNN)":[74],"across":[76,117,127,171],"multiple":[77,118],"devices.":[78],"Our":[79,156],"key":[80],"insight":[81],"breaking":[84],"the":[85,125,135,175,182,188],"bottleneck":[87],"requires":[88],"splitting":[89],"at":[91,96],"sub-layer":[92],"granularity":[93],"rather":[94],"than":[95],"layer":[97],"boundaries.":[98],"We":[99,133],"reinterpret":[100],"pre-trained":[101],"enable":[104],"kernel-wise":[105],"neuron-wise":[107],"partitioning,":[108],"distribute":[110],"both":[111],"parameters":[113],"activations":[116],"A":[120],"lightweight,":[121],"resource-aware":[122],"coordinator":[123],"orchestrates":[124],"MCU":[128,167],"devices":[129],"with":[130],"heterogeneous":[131],"implement":[134],"proposed":[136],"real":[140],"testbed":[141],"evaluate":[143],"it":[144],"up":[146],"8":[148],"using":[150],"MobileNetV2,":[151],"representative":[153],"CNN":[154,161],"model.":[155],"experimental":[157],"results":[158],"show":[159],"single":[166],"can":[168,194],"be":[169,195],"executed":[170],"MCUs,":[173],"reducing":[174],"per-MCU":[176],"RAM":[178],"while":[180],"maintaining":[181],"practical":[183],"end-to-end":[184],"latency.":[186],"All":[187],"source":[189],"code":[190],"work":[193],"found":[196],"here:":[197],"https://github.com/shashsuresh/split-inference-on-MCUs.":[198]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-13T00:00:00"}
