{"id":"https://openalex.org/W4319067155","doi":"https://doi.org/10.1145/3581576.3581618","title":"Are we ready for broader adoption of ARM in the HPC community: Performance and Energy Efficiency Analysis of Benchmarks and Applications Executed on High-End ARM Systems","display_name":"Are we ready for broader adoption of ARM in the HPC community: Performance and Energy Efficiency Analysis of Benchmarks and Applications Executed on High-End ARM Systems","publication_year":2023,"publication_date":"2023-02-03","ids":{"openalex":"https://openalex.org/W4319067155","doi":"https://doi.org/10.1145/3581576.3581618"},"language":"en","primary_location":{"id":"doi:10.1145/3581576.3581618","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581576.3581618","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the HPC Asia 2023 Workshops","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059317345","display_name":"Nikolay A. Simakov","orcid":"https://orcid.org/0000-0001-6131-5979"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Nikolay A. Simakov","raw_affiliation_strings":["Center for Computational Research, SUNY University at Buffalo, United States"],"raw_orcid":"https://orcid.org/0000-0001-6131-5979","affiliations":[{"raw_affiliation_string":"Center for Computational Research, SUNY University at Buffalo, United States","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010580969","display_name":"Robert L. DeLeon","orcid":"https://orcid.org/0000-0003-1417-8363"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robert L. Deleon","raw_affiliation_strings":["Center for Computational Research, Center for Computational Research, SUNY University at Buffalo, United States"],"raw_orcid":"https://orcid.org/0000-0003-1417-8363","affiliations":[{"raw_affiliation_string":"Center for Computational Research, Center for Computational Research, SUNY University at Buffalo, United States","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087331881","display_name":"Joseph P. White","orcid":"https://orcid.org/0000-0003-0078-5330"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Joseph P. White","raw_affiliation_strings":["Center for Computational Research, SUNY University at Buffalo, United States"],"raw_orcid":"https://orcid.org/0000-0003-0078-5330","affiliations":[{"raw_affiliation_string":"Center for Computational Research, SUNY University at Buffalo, United States","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014096956","display_name":"Matthew D. Jones","orcid":"https://orcid.org/0000-0001-7293-226X"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Matthew D. Jones","raw_affiliation_strings":["Center for Computational Research, SUNY University at Buffalo, United States"],"raw_orcid":"https://orcid.org/0000-0001-7293-226X","affiliations":[{"raw_affiliation_string":"Center for Computational Research, SUNY University at Buffalo, United States","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086695342","display_name":"Thomas R. Furlani","orcid":"https://orcid.org/0000-0002-4683-0814"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas R. Furlani","raw_affiliation_strings":["Center for Computational Research, SUNY University at Buffalo, United States"],"raw_orcid":"https://orcid.org/0000-0002-4683-0814","affiliations":[{"raw_affiliation_string":"Center for Computational Research, SUNY University at Buffalo, United States","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056470242","display_name":"Eva Siegmann","orcid":"https://orcid.org/0000-0003-1216-1576"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eva Siegmann","raw_affiliation_strings":["Institute for Advanced Computational Science, Stony Brook University, United States"],"raw_orcid":"https://orcid.org/0000-0003-1216-1576","affiliations":[{"raw_affiliation_string":"Institute for Advanced Computational Science, Stony Brook University, United States","institution_ids":["https://openalex.org/I59553526"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010174060","display_name":"Robert J. Harrison","orcid":"https://orcid.org/0000-0002-8777-7466"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Robert J. Harrison","raw_affiliation_strings":["Institute for Advanced Computational Science, Stony Brook University, United States"],"raw_orcid":"https://orcid.org/0000-0002-8777-7466","affiliations":[{"raw_affiliation_string":"Institute for Advanced Computational Science, Stony Brook University, United States","institution_ids":["https://openalex.org/I59553526"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5059317345"],"corresponding_institution_ids":["https://openalex.org/I63190737"],"apc_list":null,"apc_paid":null,"fwci":4.1894,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.94651021,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"78","last_page":"86"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/x86","display_name":"x86","score":0.9195021390914917},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7709670066833496},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.6668689250946045},{"id":"https://openalex.org/keywords/porting","display_name":"Porting","score":0.6226818561553955},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.616544246673584},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.5392322540283203},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.49263960123062134},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4666310250759125},{"id":"https://openalex.org/keywords/arm-architecture","display_name":"ARM architecture","score":0.4551025927066803},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.32008177042007446}],"concepts":[{"id":"https://openalex.org/C170723468","wikidata":"https://www.wikidata.org/wiki/Q182933","display_name":"x86","level":3,"score":0.9195021390914917},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7709670066833496},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.6668689250946045},{"id":"https://openalex.org/C106251023","wikidata":"https://www.wikidata.org/wiki/Q851989","display_name":"Porting","level":3,"score":0.6226818561553955},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.616544246673584},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.5392322540283203},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.49263960123062134},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4666310250759125},{"id":"https://openalex.org/C26771161","wikidata":"https://www.wikidata.org/wiki/Q16980","display_name":"ARM architecture","level":2,"score":0.4551025927066803},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.32008177042007446},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581576.3581618","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581576.3581618","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the HPC Asia 2023 Workshops","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8700000047683716,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G2764879464","display_name":null,"funder_award_id":"OAC 2137603 and OAC 1927880","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1895692106","https://openalex.org/W2096339900","https://openalex.org/W2115110170","https://openalex.org/W2121047119","https://openalex.org/W2151316504","https://openalex.org/W2507549455","https://openalex.org/W2913716454","https://openalex.org/W3020638658","https://openalex.org/W3035762603","https://openalex.org/W3092054218","https://openalex.org/W3103156673","https://openalex.org/W3104098743","https://openalex.org/W3186737188","https://openalex.org/W4296594301"],"related_works":["https://openalex.org/W2386329253","https://openalex.org/W2387474457","https://openalex.org/W2384479030","https://openalex.org/W3195889798","https://openalex.org/W2376033584","https://openalex.org/W2973892509","https://openalex.org/W2352844827","https://openalex.org/W2374888813","https://openalex.org/W2160463718","https://openalex.org/W3095952171"],"abstract_inverted_index":{"A":[0],"set":[1],"of":[2,51,75,82,94,113,165,170],"benchmarks,":[3],"including":[4],"numerical":[5],"libraries":[6],"and":[7,27,33,64,137,160,178,209,223],"real-world":[8],"scientific":[9],"applications,":[10],"were":[11],"run":[12],"on":[13,89],"several":[14],"modern":[15],"ARM":[16,99,142,181,228],"systems":[17,31,204],"(Amazon":[18],"Graviton":[19],"3/2,":[20],"Futjutsu":[21],"A64FX,":[22],"Ampere":[23],"Altra,":[24],"Thunder":[25],"X2)":[26],"compared":[28],"to":[29,38,153,156,187],"x86":[30,158,166,193],"(Intel":[32],"AMD)":[34],"as":[35,37,235],"well":[36],"hybrid":[39],"Intel":[40],"x86/NVIDIA":[41],"GPUs":[42],"systems.":[43],"For":[44],"benchmarking":[45],"automation,":[46],"the":[47,79,90,95,202,206,210,215],"application":[48,68],"kernel":[49,69],"module":[50,70],"XDMoD":[52,55],"was":[53,147,182,200],"used.":[54],"is":[56],"a":[57,111,232,236],"comprehensive":[58],"suite":[59],"for":[60,107],"HPC":[61,76,118,238],"resource":[62],"utilization":[63],"performance":[65,73,199],"monitoring.":[66],"The":[67,104],"enables":[71],"continuous":[72],"monitoring":[74],"resources":[77],"through":[78],"regular":[80],"execution":[81,179],"user":[83],"applications.":[84],"It":[85],"has":[86],"been":[87],"used":[88,106],"Ookami":[91],"system":[92,239],"(one":[93],"first":[96],"USA-based":[97],"Fujitsu":[98],"A64FX":[100],"SVE":[101],"512":[102],"systems).":[103],"applications":[105],"this":[108],"study":[109],"span":[110],"variety":[112],"computational":[114],"paradigms:":[115],"HPCC":[116],"(several":[117],"benchmarks),":[119],"NWChem":[120],"(ab":[121],"initio":[122],"chemistry),":[123],"Open":[124],"Foam(partial":[125],"differential":[126],"equation":[127],"solver),":[128],"GROMACS":[129],"(biomolecular":[130],"simulation),":[131],"AI":[132],"Benchmark":[133],"Alpha":[134],"(AI":[135],"benchmark)":[136],"Enzo":[138],"(adaptive":[139],"mesh":[140],"refinement).":[141],"performance,":[143,222],"while":[144],"generally":[145],"slower,":[146],"nonetheless":[148],"shown":[149,183],"in":[150,184],"many":[151],"cases":[152,186,196],"be":[154,188],"comparable":[155,221],"current":[157,226],"counterparts":[159],"often":[161],"outperforms":[162],"previous":[163],"generations":[164],"CPUs.":[167],"In":[168,195],"terms":[169],"energy":[171,190,212],"efficiency,":[172],"which":[173],"considers":[174],"both":[175],"power":[176],"consumption":[177],"time,":[180],"most":[185],"more":[189],"efficient":[191],"than":[192],"processors.":[194],"where":[197],"GPU":[198,203],"tested,":[201],"showed":[205],"fastest":[207],"speed":[208],"highest":[211],"efficiency.":[213],"Given":[214],"high":[216],"core":[217],"count":[218],"per":[219],"node,":[220],"competitive":[224],"pricing,":[225],"high-end":[227],"CPUs":[229],"are":[230],"already":[231],"valid":[233],"choice":[234],"primary":[237],"processor.":[240]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
