{"id":"https://openalex.org/W7119536258","doi":"https://doi.org/10.1145/3773656.3773667","title":"PRISM: Profiling-Free Symbolic Memory-Driven Strategy Planner for Large DNN Model Training","display_name":"PRISM: Profiling-Free Symbolic Memory-Driven Strategy Planner for Large DNN Model Training","publication_year":2026,"publication_date":"2026-01-09","ids":{"openalex":"https://openalex.org/W7119536258","doi":"https://doi.org/10.1145/3773656.3773667"},"language":"en","primary_location":{"id":"doi:10.1145/3773656.3773667","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3773656.3773667","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Supercomputing Asia and International Conference on High Performance Computing in Asia Pacific Region","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3773656.3773667","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122316047","display_name":"Ruiwen Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I4210123571","display_name":"Huawei Technologies (France)","ror":"https://ror.org/02rbzf697","country_code":"FR","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210123571"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Ruiwen Wang","raw_affiliation_strings":["Sorbonne University, Paris, France and Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France"],"raw_orcid":"https://orcid.org/0009-0000-6709-5970","affiliations":[{"raw_affiliation_string":"Sorbonne University, Paris, France and Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France","institution_ids":["https://openalex.org/I39804081","https://openalex.org/I4210123571"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122303306","display_name":"Philippe Fang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123571","display_name":"Huawei Technologies (France)","ror":"https://ror.org/02rbzf697","country_code":"FR","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210123571"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Philippe Fang","raw_affiliation_strings":["Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France"],"raw_orcid":"https://orcid.org/0009-0003-6981-5355","affiliations":[{"raw_affiliation_string":"Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France","institution_ids":["https://openalex.org/I4210123571"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chong Li","orcid":"https://orcid.org/0000-0002-4160-7170"},"institutions":[{"id":"https://openalex.org/I4210123571","display_name":"Huawei Technologies (France)","ror":"https://ror.org/02rbzf697","country_code":"FR","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210123571"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Chong Li","raw_affiliation_strings":["Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France"],"raw_orcid":"https://orcid.org/0000-0002-4160-7170","affiliations":[{"raw_affiliation_string":"Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France","institution_ids":["https://openalex.org/I4210123571"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080257325","display_name":"Thibaut Tachon","orcid":"https://orcid.org/0000-0003-3264-5535"},"institutions":[{"id":"https://openalex.org/I4210123571","display_name":"Huawei Technologies (France)","ror":"https://ror.org/02rbzf697","country_code":"FR","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210123571"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Thibaut Tachon","raw_affiliation_strings":["Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France"],"raw_orcid":"https://orcid.org/0000-0003-3264-5535","affiliations":[{"raw_affiliation_string":"Distributed and Parallel Technologies Laboratory, Huawei Technologies, Boulogne-Billancourt, France","institution_ids":["https://openalex.org/I4210123571"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019249875","display_name":"Raja Appuswamy","orcid":"https://orcid.org/0000-0001-5887-4091"},"institutions":[{"id":"https://openalex.org/I1902872","display_name":"EURECOM","ror":"https://ror.org/00sse7z02","country_code":"FR","type":"education","lineage":["https://openalex.org/I1902872","https://openalex.org/I205703379"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Raja Appuswamy","raw_affiliation_strings":["Institut Eur\u00e9com, Biot, France"],"raw_orcid":"https://orcid.org/0000-0001-5887-4091","affiliations":[{"raw_affiliation_string":"Institut Eur\u00e9com, Biot, France","institution_ids":["https://openalex.org/I1902872"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03754212,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"308","last_page":"319"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.45179998874664307,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.45179998874664307,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.10779999941587448,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.08309999853372574,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.476500004529953},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.415800005197525},{"id":"https://openalex.org/keywords/flops","display_name":"FLOPS","score":0.3856000006198883},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.3824000060558319},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.3700000047683716},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.357699990272522}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7901999950408936},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.476500004529953},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4442000091075897},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.415800005197525},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.3856000006198883},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.3824000060558319},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.37689998745918274},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.3700000047683716},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.357699990272522},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.33489999175071716},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.31119999289512634},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3066999912261963},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.30230000615119934},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.2687999904155731},{"id":"https://openalex.org/C67666897","wikidata":"https://www.wikidata.org/wiki/Q165896","display_name":"Prism","level":2,"score":0.260699987411499},{"id":"https://openalex.org/C2781357197","wikidata":"https://www.wikidata.org/wiki/Q5757597","display_name":"High memory","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.2513999938964844}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3773656.3773667","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3773656.3773667","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Supercomputing Asia and International Conference on High Performance Computing in Asia Pacific Region","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-05564696v1","is_oa":true,"landing_page_url":"https://hal.science/hal-05564696","pdf_url":"https://hal.science/hal-05564696v1/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"SCA/HPCAsia 2026: Supercomputing Asia and International Conference on High Performance Computing in Asia Pacific Region, Jan 2026, Osaka, Japan. pp.308 - 319, &#x27E8;10.1145/3773656.3773667&#x27E9;","raw_type":"Conference papers"},{"id":"pmh:oai:fr.eurecom:8486","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196942","display_name":"Graduate School and Research Center in Digital Science (EURECOM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1902872","host_organization_name":"EURECOM","host_organization_lineage":["https://openalex.org/I1902872"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"SCA/HPC Asia 2026, Supercomputing Asia / International Conference on High Performance Computing in the Asia-Pacific Region, 26-29 January 2026, Osaka, Japan","raw_type":"Conference"}],"best_oa_location":{"id":"doi:10.1145/3773656.3773667","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3773656.3773667","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Supercomputing Asia and International Conference on High Performance Computing in Asia Pacific Region","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.5302796959877014,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2969388332","https://openalex.org/W3204998121","https://openalex.org/W4310282800","https://openalex.org/W4389518760","https://openalex.org/W4399452094"],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"growth":[2],"of":[3,72],"large-scale":[4,40],"deep":[5],"neural":[6],"networks":[7],"(DNNs)":[8],"has":[9],"introduced":[10],"severe":[11],"memory":[12,64,118,131],"and":[13,38,75,91,99,133,143],"performance":[14],"bottlenecks":[15],"during":[16],"distributed":[17],"training.":[18,58],"Existing":[19],"automated":[20],"planners":[21],"for":[22,55],"parallelization":[23],"strategies":[24,115],"often":[25],"rely":[26],"heavily":[27],"on":[28],"profiling":[29],"or":[30],"empirical":[31],"tuning,":[32],"which":[33],"significantly":[34],"increases":[35],"engineering":[36],"cost":[37,65],"wastes":[39],"cluster":[41],"resources.":[42],"In":[43],"this":[44],"work,":[45],"we":[46],"present":[47],"PRISM,":[48],"a":[49,61,78],"profiling-free,":[50],"symbolic":[51,63],"memory-driven":[52],"strategy":[53,104],"planner":[54],"large":[56,124],"DNN":[57],"PRISM":[59,110,128],"introduces":[60],"unified":[62],"model":[66,80],"that":[67,127],"captures":[68],"the":[69],"layered":[70],"structure":[71],"modern":[73],"architectures":[74],"integrates":[76],"with":[77],"communication":[79,144],"to":[81],"evaluate":[82],"trade-offs":[83],"across":[84,122],"data,":[85],"tensor,":[86],"pipeline,":[87,89],"virtual":[88],"expert,":[90],"sequence":[92],"parallelism,":[93],"as":[94,96,106],"well":[95],"activation":[97],"recomputation":[98],"optimizer":[100],"sharding.":[101],"By":[102],"formulating":[103],"selection":[105],"an":[107],"optimization":[108],"problem,":[109],"identifies":[111],"globally":[112],"optimal":[113],"parallel":[114],"under":[116],"device":[117],"budgets.":[119],"Our":[120],"evaluation":[121],"representative":[123],"models":[125],"demonstrates":[126],"achieves":[129],"accurate":[130],"prediction":[132],"substantial":[134],"improvements":[135],"in":[136],"Model":[137],"FLOPs":[138],"Utilization":[139],"(MFU),":[140],"reducing":[141],"bubble":[142],"overheads":[145],"without":[146],"costly":[147],"profiling.":[148]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-01-09T00:00:00"}
