{"id":"https://openalex.org/W4407736717","doi":"https://doi.org/10.1109/tcad.2025.3543715","title":"Optimizing DNN Inference on Multi-accelerator SoCs at Training-Time","display_name":"Optimizing DNN Inference on Multi-accelerator SoCs at Training-Time","publication_year":2025,"publication_date":"2025-02-19","ids":{"openalex":"https://openalex.org/W4407736717","doi":"https://doi.org/10.1109/tcad.2025.3543715"},"language":"en","primary_location":{"id":"doi:10.1109/tcad.2025.3543715","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2025.3543715","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042082293","display_name":"Matteo Risso","orcid":"https://orcid.org/0000-0002-4641-9742"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Polytechnic University of Turin","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Matteo Risso","raw_affiliation_strings":["Department of Control and Computer Engineering, Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Control and Computer Engineering, Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032095821","display_name":"Alessio Burrello","orcid":"https://orcid.org/0000-0002-6215-8220"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Polytechnic University of Turin","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessio Burrello","raw_affiliation_strings":["Department of Control and Computer Engineering, Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Control and Computer Engineering, Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080843266","display_name":"Daniele Jahier Pagliari","orcid":"https://orcid.org/0000-0002-2872-7071"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Polytechnic University of Turin","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Daniele Jahier Pagliari","raw_affiliation_strings":["Department of Control and Computer Engineering, Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Control and Computer Engineering, Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5042082293"],"corresponding_institution_ids":["https://openalex.org/I177477856"],"apc_list":null,"apc_paid":null,"fwci":1.4882,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.80636212,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"44","issue":"9","first_page":"3532","last_page":"3545"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11005","display_name":"Radiation Effects in Electronics","score":0.9829000234603882,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11005","display_name":"Radiation Effects in Electronics","score":0.9829000234603882,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11949","display_name":"Nuclear Physics and Applications","score":0.9829000234603882,"subfield":{"id":"https://openalex.org/subfields/3108","display_name":"Radiation"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11044","display_name":"Particle Detector Development and Performance","score":0.9817000031471252,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6910601854324341},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5862550139427185},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5856615304946899},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3748794198036194},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3647523820400238},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.04632759094238281}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6910601854324341},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5862550139427185},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5856615304946899},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3748794198036194},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3647523820400238},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.04632759094238281},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcad.2025.3543715","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2025.3543715","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2258208517","display_name":null,"funder_award_id":"101095947","funder_id":"https://openalex.org/F4320319005","funder_display_name":"Key Digital Technologies Joint Undertaking"}],"funders":[{"id":"https://openalex.org/F4320319005","display_name":"Key Digital Technologies Joint Undertaking","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W2605258629","https://openalex.org/W2807927893","https://openalex.org/W2899641901","https://openalex.org/W2950865323","https://openalex.org/W2963122961","https://openalex.org/W2963918968","https://openalex.org/W2964862330","https://openalex.org/W2965862774","https://openalex.org/W2971002981","https://openalex.org/W2982479999","https://openalex.org/W3016430712","https://openalex.org/W3034887213","https://openalex.org/W3169512402","https://openalex.org/W4206336135","https://openalex.org/W4220837341","https://openalex.org/W4285269946","https://openalex.org/W4285305827","https://openalex.org/W4289828099","https://openalex.org/W4293024010","https://openalex.org/W4297097447","https://openalex.org/W4300171661","https://openalex.org/W4311277703","https://openalex.org/W4312298069","https://openalex.org/W4312998584","https://openalex.org/W4386568606","https://openalex.org/W4386764021","https://openalex.org/W4386764053","https://openalex.org/W4386764983","https://openalex.org/W4386859301","https://openalex.org/W4387444863","https://openalex.org/W4387490516","https://openalex.org/W4391985770","https://openalex.org/W6734593296","https://openalex.org/W6737664043","https://openalex.org/W6752515464","https://openalex.org/W6756887525","https://openalex.org/W6762718338","https://openalex.org/W6770425567","https://openalex.org/W6787972765","https://openalex.org/W6790890768","https://openalex.org/W6811928498"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W230091440","https://openalex.org/W2390279801","https://openalex.org/W2233261550","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2810751659"],"abstract_inverted_index":{"The":[0],"demand":[1],"for":[2],"executing":[3],"deep":[4],"neural":[5,132],"networks":[6,193],"(DNNs)":[7],"with":[8,154,255],"low":[9],"latency":[10,153,200,208],"and":[11,134,175,184],"minimal":[12,256],"power":[13],"consumption":[14,151],"at":[15,227],"the":[16,21,46,92,122,131,140,147,155,160,164,195,207,214,238],"edge":[17],"has":[18],"led":[19],"to":[20,41,56,81,89,145,219,230,244],"development":[22],"of":[23,115,130,163,191,209],"advanced":[24],"heterogeneous":[25,180],"systems-on-chips":[26],"(SoCs)":[27],"that":[28,110,204],"incorporate":[29],"multiple":[30,141],"specialized":[31],"computing":[32],"units":[33],"(CUs),":[34],"such":[35],"as":[36],"accelerators.":[37],"Offloading":[38],"DNN":[39,84,211],"computations":[40],"a":[42,83,107,188,210],"specific":[43],"CU":[44],"from":[45],"available":[47,142],"set":[48],"often":[49],"exposes":[50],"accuracy":[51,97,196,257],"vs":[52],"efficiency":[53],"tradeoffs,":[54],"due":[55],"differences":[57],"in":[58,137,194],"their":[59],"supported":[60],"operations":[61],"(e.g.,":[62,70],"standard":[63],"versus":[64,197],"depthwise":[65],"convolution)":[66],"or":[67,152,199],"data":[68],"representations":[69],"more/less":[71],"aggressively":[72],"quantized).":[73],"A":[74],"challenging":[75],"yet":[76],"unresolved":[77],"issue":[78],"is":[79],"how":[80],"map":[82],"onto":[85],"these":[86],"multi-CU":[87],"systems":[88],"maximally":[90],"exploit":[91],"parallelization":[93],"possibilities":[94],"while":[95],"taking":[96],"into":[98],"account.":[99],"To":[100],"address":[101],"this":[102],"problem,":[103],"we":[104],"present":[105],"ODiMO,":[106],"hardware-aware":[108],"tool":[109],"efficiently":[111],"explores":[112],"fine-grain":[113],"mapping":[114],"DNNs":[116],"among":[117],"various":[118],"on-chip":[119],"CUs,":[120,143],"during":[121],"training":[123],"phase.":[124],"ODiMO":[125,205,241],"strategically":[126],"splits":[127],"individual":[128],"layers":[129],"network":[133],"executes":[135],"them":[136],"parallel":[138],"on":[139,172,213,237],"aiming":[144],"balance":[146],"total":[148],"inference":[149],"energy":[150,198],"resulting":[156],"accuracy,":[157],"impacted":[158],"by":[159,217],"unique":[161],"features":[162],"different":[165],"hardware":[166],"units.":[167],"We":[168,186,202],"test":[169],"our":[170],"approach":[171],"CIFAR-10,":[173],"CIFAR-100,":[174],"ImageNet,":[176],"targeting":[177,235],"two":[178],"open-source":[179],"SoCs,":[181],"i.e.,":[182],"DIANA":[183],"Darkside.":[185],"obtain":[187],"rich":[189],"collection":[190],"Pareto-optimal":[192],"space.":[201],"show":[203],"reduces":[206],"executed":[212],"Darkside":[215],"SoC":[216],"up":[218,243],"<inline-formula":[220,245,259],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[221,246,260],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[222,247,261],"<tex-math":[223,248,262],"notation=\"LaTeX\">$8\\times":[224],"$":[225,250],"</tex-math></inline-formula>":[226,251],"iso-accuracy,":[228],"compared":[229],"manual":[231],"heuristic":[232],"mappings.":[233],"When":[234],"energy,":[236],"same":[239],"SoC,":[240],"produced":[242],"notation=\"LaTeX\">$50.8\\times":[249],"more":[252],"efficient":[253],"mappings,":[254],"drop":[258],"notation=\"LaTeX\">$(\\lt":[263],"0.3\\%)$":[264],"</tex-math></inline-formula>.":[265]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-02-25T23:00:34.991745","created_date":"2025-10-10T00:00:00"}
