{"id":"https://openalex.org/W4416146692","doi":"https://doi.org/10.1145/3712285.3759877","title":"Scaling the memory wall using mixed-precision - HPG-MxP on an exascale machine","display_name":"Scaling the memory wall using mixed-precision - HPG-MxP on an exascale machine","publication_year":2025,"publication_date":"2025-11-12","ids":{"openalex":"https://openalex.org/W4416146692","doi":"https://doi.org/10.1145/3712285.3759877"},"language":null,"primary_location":{"id":"doi:10.1145/3712285.3759877","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712285.3759877","pdf_url":null,"source":null,"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3712285.3759877","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051291589","display_name":"Aditya Kashi","orcid":"https://orcid.org/0000-0003-2589-3792"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Aditya Kashi","raw_affiliation_strings":["National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA"],"affiliations":[{"raw_affiliation_string":"National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028017125","display_name":"Nicholson Koukpaizan","orcid":"https://orcid.org/0009-0008-5384-9741"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicholson Koukpaizan","raw_affiliation_strings":["National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA"],"affiliations":[{"raw_affiliation_string":"National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058248684","display_name":"Hao Lu","orcid":"https://orcid.org/0000-0001-8941-870X"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hao Lu","raw_affiliation_strings":["National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA"],"affiliations":[{"raw_affiliation_string":"National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012951247","display_name":"Michael A. Matheson","orcid":"https://orcid.org/0000-0003-1512-5255"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Matheson","raw_affiliation_strings":["National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, USA"],"affiliations":[{"raw_affiliation_string":"National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014538652","display_name":"Sarp Oral","orcid":"https://orcid.org/0000-0001-8745-7078"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sarp Oral","raw_affiliation_strings":["National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA"],"affiliations":[{"raw_affiliation_string":"National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101916963","display_name":"Feiyi Wang","orcid":"https://orcid.org/0000-0002-0099-1559"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Feiyi Wang","raw_affiliation_strings":["National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA"],"affiliations":[{"raw_affiliation_string":"National Center for Computational Sciences, Oak Ridge National Laboratory (ORNL), Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5051291589"],"corresponding_institution_ids":["https://openalex.org/I1289243028"],"apc_list":null,"apc_paid":null,"fwci":3.0167,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.93109893,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"281","last_page":"297"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.33219999074935913,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.33219999074935913,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.10729999840259552,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.10260000079870224,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.5097000002861023},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.4708999991416931},{"id":"https://openalex.org/keywords/exascale-computing","display_name":"Exascale computing","score":0.46309998631477356},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.41600000858306885},{"id":"https://openalex.org/keywords/applications-of-artificial-intelligence","display_name":"Applications of artificial intelligence","score":0.3837999999523163},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.3758000135421753},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.32580000162124634}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7540000081062317},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.5097000002861023},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4952000081539154},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4758000075817108},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.4708999991416931},{"id":"https://openalex.org/C2778837361","wikidata":"https://www.wikidata.org/wiki/Q2450880","display_name":"Exascale computing","level":3,"score":0.46309998631477356},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.41600000858306885},{"id":"https://openalex.org/C157170001","wikidata":"https://www.wikidata.org/wiki/Q4781507","display_name":"Applications of artificial intelligence","level":2,"score":0.3837999999523163},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.3758000135421753},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3666999936103821},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.32580000162124634},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3197000026702881},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.30379998683929443},{"id":"https://openalex.org/C23375383","wikidata":"https://www.wikidata.org/wiki/Q176499","display_name":"Unconventional computing","level":2,"score":0.30059999227523804},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.29330000281333923},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2897000014781952},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.28380000591278076},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2824999988079071},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C2994168587","wikidata":"https://www.wikidata.org/wiki/Q5295","display_name":"Random access memory","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C123593499","wikidata":"https://www.wikidata.org/wiki/Q6008583","display_name":"In-Memory Processing","level":5,"score":0.2646999955177307},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.259799987077713}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3712285.3759877","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712285.3759877","pdf_url":null,"source":null,"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3712285.3759877","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3712285.3759877","pdf_url":null,"source":null,"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1133087070","https://openalex.org/W1506342804","https://openalex.org/W1572171512","https://openalex.org/W1982358758","https://openalex.org/W1994182141","https://openalex.org/W2074976694","https://openalex.org/W2087891564","https://openalex.org/W2100061495","https://openalex.org/W2111593426","https://openalex.org/W2128116722","https://openalex.org/W2128853364","https://openalex.org/W2140153041","https://openalex.org/W2151317657","https://openalex.org/W3038558128","https://openalex.org/W3177284785","https://openalex.org/W4233132415","https://openalex.org/W4318603194","https://openalex.org/W4392593298","https://openalex.org/W4404169347","https://openalex.org/W4407792922"],"related_works":[],"abstract_inverted_index":{"Mixed-precision":[0],"algorithms":[1,70],"have":[2,38],"been":[3],"proposed":[4],"as":[5,48],"a":[6,51,72],"way":[7],"for":[8,19],"scientific":[9,54],"computing":[10,27],"to":[11],"benefit":[12],"from":[13,67],"some":[14],"of":[15,53],"the":[16,64],"gains":[17],"seen":[18,39],"artificial":[20],"intelligence":[21],"(AI)":[22],"on":[23,71],"recent":[24],"high":[25],"performance":[26],"(HPC)":[28],"platforms.":[29],"A":[30],"few":[31],"applications":[32,56],"dominated":[33],"by":[34,42],"dense":[35],"matrix":[36],"operations":[37],"substantial":[40],"speedups":[41],"utilizing":[43],"low":[44],"precision":[45],"formats":[46],"such":[47],"FP16.":[49],"However,":[50],"majority":[52],"simulation":[55],"are":[57],"memory":[58],"bandwidth":[59],"limited.":[60],"Beyond":[61],"preliminary":[62],"studies,":[63],"practical":[65],"gain":[66],"using":[68],"mixed-precision":[69],"given":[73],"HPC":[74],"system":[75],"is":[76],"largely":[77],"unclear.":[78]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-11-12T00:00:00"}
