{"id":"https://openalex.org/W4399411982","doi":"https://doi.org/10.1109/tcad.2024.3410841","title":"Automatic Mapping of Heterogeneous DNN Models on Adaptive Multiaccelerator Systems","display_name":"Automatic Mapping of Heterogeneous DNN Models on Adaptive Multiaccelerator Systems","publication_year":2024,"publication_date":"2024-06-06","ids":{"openalex":"https://openalex.org/W4399411982","doi":"https://doi.org/10.1109/tcad.2024.3410841"},"language":"en","primary_location":{"id":"doi:10.1109/tcad.2024.3410841","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2024.3410841","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047571832","display_name":"Jieru Zhao","orcid":"https://orcid.org/0000-0001-8211-2812"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jieru Zhao","raw_affiliation_strings":["Department of CSE, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of CSE, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043486076","display_name":"Guan Shen","orcid":"https://orcid.org/0000-0002-1264-8715"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guan Shen","raw_affiliation_strings":["Department of CSE, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of CSE, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102769588","display_name":"Wenchao Ding","orcid":"https://orcid.org/0000-0003-4249-526X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenchao Ding","raw_affiliation_strings":["Fudan University, Shanghai, China","Academy for Engineering and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"Academy for Engineering and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100377840","display_name":"Quan Chen","orcid":"https://orcid.org/0000-0001-5832-0347"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quan Chen","raw_affiliation_strings":["Department of CSE, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of CSE, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039318240","display_name":"Minyi Guo","orcid":"https://orcid.org/0000-0003-0034-2302"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minyi Guo","raw_affiliation_strings":["Department of CSE, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of CSE, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5047571832"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06588616,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"43","issue":"12","first_page":"4701","last_page":"4714"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9114999771118164,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9114999771118164,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10346","display_name":"Magnetic confinement fusion research","score":0.9002000093460083,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6592277884483337}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6592277884483337}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcad.2024.3410841","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2024.3410841","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.5099999904632568}],"awards":[{"id":"https://openalex.org/G5813330169","display_name":null,"funder_award_id":"62102249","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7918780534","display_name":null,"funder_award_id":"62472273","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8136545603","display_name":null,"funder_award_id":"62232015","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2625954420","https://openalex.org/W2883929540","https://openalex.org/W2913221350","https://openalex.org/W2945306514","https://openalex.org/W2962953210","https://openalex.org/W2964137095","https://openalex.org/W2969289739","https://openalex.org/W3006377070","https://openalex.org/W3012249773","https://openalex.org/W3025152414","https://openalex.org/W3096425133","https://openalex.org/W3096609285","https://openalex.org/W3158233068","https://openalex.org/W3187788856","https://openalex.org/W3196923642","https://openalex.org/W4280489237","https://openalex.org/W4286001027","https://openalex.org/W4293025058","https://openalex.org/W4293025165","https://openalex.org/W4312933868","https://openalex.org/W4386764246","https://openalex.org/W4387321091","https://openalex.org/W4389518760","https://openalex.org/W4389976716","https://openalex.org/W4390874575","https://openalex.org/W4392450088","https://openalex.org/W4393153751","https://openalex.org/W6637373629","https://openalex.org/W6684191040","https://openalex.org/W6748324931","https://openalex.org/W6766904570","https://openalex.org/W6766978945","https://openalex.org/W6767997687","https://openalex.org/W6770820644","https://openalex.org/W6800139874","https://openalex.org/W6811928498","https://openalex.org/W6854866820","https://openalex.org/W6857332069"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"As":[0,29],"DNNs":[1],"are":[2],"developing":[3],"rapidly,":[4],"the":[5,83,114,120,124,149,160],"computational":[6],"and":[7,26,37,50,67,79,100,116,151],"memory":[8],"burden":[9],"imposed":[10],"on":[11,155],"hardware":[12],"systems":[13,42],"grows":[14],"exponentially.":[15],"This":[16],"becomes":[17],"even":[18],"more":[19],"severe":[20],"for":[21,69,144],"large":[22],"language":[23],"models":[24,157],"(LLMs)":[25],"multimodal":[27],"models.":[28],"a":[30,54,59,91],"promising":[31],"solution":[32],"that":[33,95,138],"achieves":[34,140],"high":[35,121],"scalability":[36],"low":[38],"manufacturing":[39],"cost,":[40],"multiaccelerator":[41],"widely":[43],"exist":[44],"in":[45,82],"data":[46],"centers,":[47],"cloud":[48],"platforms,":[49],"mobile":[51],"SoCs.":[52],"Thus,":[53],"challenging":[55],"problem":[56],"arises:":[57],"selecting":[58],"proper":[60],"combination":[61],"of":[62,123],"accelerators":[63],"from":[64],"available":[65],"designs":[66],"searching":[68],"efficient":[70],"DNN":[71,145],"mapping":[72,93,131],"strategies,":[73],"to":[74,105,112,133,148,159],"fully":[75],"exploit":[76],"computation":[77,115],"resources":[78],"communication":[80,117],"bandwidth":[81],"system.":[84],"To":[85],"this":[86],"end,":[87],"we":[88,127],"propose":[89,128],"MARS,":[90],"novel":[92],"framework":[94],"performs":[96],"computation-aware":[97],"accelerator":[98],"selection":[99],"applies":[101],"communication-aware":[102],"sharding":[103],"strategies":[104],"maximize":[106],"parallelism.":[107],"We":[108],"also":[109],"provide":[110],"optimizations":[111],"overlap":[113],"latency.":[118],"Considering":[119],"complexity":[122],"design":[125],"space,":[126],"two":[129],"effective":[130],"algorithms":[132],"explore":[134],"it.":[135],"Experiments":[136],"show":[137],"MARS":[139],"34.3%":[141],"latency":[142,153],"reduction":[143,154],"workloads":[146],"compared":[147,158],"baseline":[150],"63.0%":[152],"heterogeneous":[156],"corresponding":[161],"state-of-the-art":[162],"method.":[163]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
