{"id":"https://openalex.org/W4402809029","doi":"https://doi.org/10.1109/tpds.2024.3466913","title":"Efficient Schedule Construction for Distributed Execution of Large DNN Models","display_name":"Efficient Schedule Construction for Distributed Execution of Large DNN Models","publication_year":2024,"publication_date":"2024-09-24","ids":{"openalex":"https://openalex.org/W4402809029","doi":"https://doi.org/10.1109/tpds.2024.3466913"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2024.3466913","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tpds.2024.3466913","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027752718","display_name":"Zhiqi Lin","orcid":"https://orcid.org/0000-0002-8050-6196"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiqi Lin","raw_affiliation_strings":["School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","School of Computer Science and Technology, University of Science and Technology of China, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075076538","display_name":"Youshan Miao","orcid":"https://orcid.org/0000-0002-2395-9965"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Youshan Miao","raw_affiliation_strings":["Microsoft Research, Beijing, China","Microsoft Research, U.K"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft Research, U.K","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086274010","display_name":"Guanbin Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanbin Xu","raw_affiliation_strings":["School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","School of Computer Science and Technology, University of Science and Technology of China, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100354226","display_name":"Cheng Li","orcid":"https://orcid.org/0000-0001-7064-6120"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Li","raw_affiliation_strings":["School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","School of Computer Science and Technology, University of Science and Technology of China, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001454502","display_name":"Olli Saarikivi","orcid":"https://orcid.org/0000-0001-7596-4734"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Olli Saarikivi","raw_affiliation_strings":["Microsoft Research, Beijing, China","Microsoft Research, U.K"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft Research, U.K","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077514991","display_name":"Saeed Maleki","orcid":"https://orcid.org/0000-0003-1107-1827"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]},{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Saeed Maleki","raw_affiliation_strings":["Microsoft Research, Beijing, China","Microsoft Research, U.K"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft Research, U.K","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101858187","display_name":"Fan Yang","orcid":"https://orcid.org/0000-0002-4113-764X"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Fan Yang","raw_affiliation_strings":["Microsoft Research, Beijing, China","Microsoft Research, U.K"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft Research, U.K","institution_ids":["https://openalex.org/I4210164937"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5027752718"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.2623,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.57202524,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"35","issue":"12","first_page":"2375","last_page":"2391"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9118000268936157,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9118000268936157,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8425856828689575},{"id":"https://openalex.org/keywords/schedule","display_name":"Schedule","score":0.6055999994277954},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5568243861198425},{"id":"https://openalex.org/keywords/processor-scheduling","display_name":"Processor scheduling","score":0.5177813768386841},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4765903651714325},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4669222831726074},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.3215898275375366},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.18872228264808655},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.10771340131759644}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8425856828689575},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.6055999994277954},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5568243861198425},{"id":"https://openalex.org/C2984822820","wikidata":"https://www.wikidata.org/wiki/Q1123036","display_name":"Processor scheduling","level":3,"score":0.5177813768386841},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4765903651714325},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4669222831726074},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3215898275375366},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.18872228264808655},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.10771340131759644},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2024.3466913","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tpds.2024.3466913","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1480909796","https://openalex.org/W1593916827","https://openalex.org/W2012512596","https://openalex.org/W2018348175","https://openalex.org/W2025289275","https://openalex.org/W2063123613","https://openalex.org/W2296760900","https://openalex.org/W2883830791","https://openalex.org/W2969388332","https://openalex.org/W2991040477","https://openalex.org/W3012479151","https://openalex.org/W3081168214","https://openalex.org/W3129831491","https://openalex.org/W3132107458","https://openalex.org/W3132977829","https://openalex.org/W3169483174","https://openalex.org/W3199404008","https://openalex.org/W3206832494","https://openalex.org/W4220741164","https://openalex.org/W4238759521","https://openalex.org/W4312349930","https://openalex.org/W4312910992","https://openalex.org/W4386840193"],"related_works":["https://openalex.org/W2195904091","https://openalex.org/W1809394610","https://openalex.org/W2128410848","https://openalex.org/W2101285930","https://openalex.org/W2102390841","https://openalex.org/W2118368532","https://openalex.org/W2126232624","https://openalex.org/W2434525066","https://openalex.org/W3140149227","https://openalex.org/W2130555437"],"abstract_inverted_index":{"Increasingly":[0],"complex":[1],"and":[2,18,21,61,81,120,136,154],"diverse":[3,46,84],"deep":[4],"neural":[5],"network":[6],"(DNN)":[7],"models":[8,143],"necessitate":[9],"distributing":[10],"the":[11,42,59,94,97],"execution":[12],"across":[13,108],"multiple":[14],"devices":[15],"for":[16,27,74,77,83,126],"training":[17,80,135,151],"inference":[19,82,137,158],"tasks,":[20],"also":[22],"require":[23],"carefully":[24],"planned":[25],"schedules":[26,36,53,76,100,125],"performance.":[28,138],"However,":[29],"existing":[30],"practices":[31],"often":[32,101],"rely":[33],"on":[34],"predefined":[35],"that":[37,72,96,145],"may":[38],"not":[39],"fully":[40],"exploit":[41],"benefits":[43],"of":[44],"emerging":[45],"model-aware":[47],"operator":[48,85,128],"placement":[49,86,129],"strategies.":[50,87],"Handcrafting":[51],"high-efficiency":[52],"can":[54],"be":[55],"challenging":[56],"due":[57],"to":[58,114,149,156],"large":[60],"varying":[62],"schedule":[63,121],"space.":[64],"This":[65,112],"paper":[66],"presents":[67],"Tessel,":[68],"an":[69],"automated":[70],"system":[71],"searches":[73],"efficient":[75,99],"distributed":[78],"DNN":[79,142],"To":[88],"reduce":[89],"search":[90],"costs,":[91],"Tessel":[92,131,146],"leverages":[93],"insight":[95],"most":[98],"exhibit":[102],"repetitive":[103],"pattern":[104],"(<italic":[105],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[106],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">repetend</i>)":[107],"different":[109],"data":[110],"inputs.":[111],"leads":[113],"a":[115],"two-phase":[116],"approach:":[117],"repetend":[118],"construction":[119],"completion.":[122],"By":[123],"exploring":[124],"various":[127],"strategies,":[130],"significantly":[132],"improves":[133],"both":[134],"Experiments":[139],"with":[140],"representative":[141],"demonstrate":[144],"achieves":[147],"up":[148,155],"5.5\u00d7":[150],"performance":[152],"speedup":[153],"38%":[157],"latency":[159],"reduction.":[160]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-01-17T23:10:49.606395","created_date":"2025-10-10T00:00:00"}
