{"id":"https://openalex.org/W4390683828","doi":"https://doi.org/10.1145/3636480.3637283","title":"Impact of Write-Allocate Elimination on Fujitsu A64FX","display_name":"Impact of Write-Allocate Elimination on Fujitsu A64FX","publication_year":2024,"publication_date":"2024-01-08","ids":{"openalex":"https://openalex.org/W4390683828","doi":"https://doi.org/10.1145/3636480.3637283"},"language":"en","primary_location":{"id":"doi:10.1145/3636480.3637283","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3636480.3637283","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on High Performance Computing in Asia-Pacific Region Workshops","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102007924","display_name":"Yan Kang","orcid":"https://orcid.org/0009-0002-8718-1491"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yan Kang","raw_affiliation_strings":["The Pennsylvania State University, United States"],"affiliations":[{"raw_affiliation_string":"The Pennsylvania State University, United States","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100670911","display_name":"Sayan Ghosh","orcid":"https://orcid.org/0000-0001-8758-7657"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sayan Ghosh","raw_affiliation_strings":["Pacific Northwest National Laboratory, United States"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, United States","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007116603","display_name":"Mahmut Kandemir","orcid":"https://orcid.org/0000-0002-9940-9951"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mahmut Kandemir","raw_affiliation_strings":["The Pennsylvania State University, United States"],"affiliations":[{"raw_affiliation_string":"The Pennsylvania State University, United States","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102811479","display_name":"Andr\u00e9s M\u00e1rquez","orcid":"https://orcid.org/0000-0002-4313-1882"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andr\u00e9s Marquez","raw_affiliation_strings":["Pacific Northwest National Laboratory, United States"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, United States","institution_ids":["https://openalex.org/I142606810"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5102007924"],"corresponding_institution_ids":["https://openalex.org/I130769515"],"apc_list":null,"apc_paid":null,"fwci":0.5198,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.55393847,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"24","last_page":"35"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8521726131439209},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.569491446018219},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.5633533000946045},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.5061420798301697},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.4744994342327118},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.46913430094718933},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.456074059009552},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.43829959630966187},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.41163578629493713},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.35324758291244507},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.16714566946029663}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8521726131439209},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.569491446018219},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.5633533000946045},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.5061420798301697},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.4744994342327118},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.46913430094718933},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.456074059009552},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.43829959630966187},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.41163578629493713},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.35324758291244507},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.16714566946029663},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3636480.3637283","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3636480.3637283","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on High Performance Computing in Asia-Pacific Region Workshops","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.47999998927116394,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1955594754","https://openalex.org/W1961751213","https://openalex.org/W2080592089","https://openalex.org/W2131681506","https://openalex.org/W2558632230","https://openalex.org/W2897639728","https://openalex.org/W2914439491","https://openalex.org/W2921480401","https://openalex.org/W2996519492","https://openalex.org/W3097283637","https://openalex.org/W3097636320","https://openalex.org/W3099768174","https://openalex.org/W3107316479","https://openalex.org/W3180512434","https://openalex.org/W3204834182","https://openalex.org/W3205213976","https://openalex.org/W3206873289","https://openalex.org/W4253426709","https://openalex.org/W6798466079"],"related_works":["https://openalex.org/W2133682266","https://openalex.org/W2497617944","https://openalex.org/W2167303720","https://openalex.org/W1563139915","https://openalex.org/W2109715593","https://openalex.org/W2061075966","https://openalex.org/W3147501184","https://openalex.org/W2268996566","https://openalex.org/W4256652509","https://openalex.org/W2140219379"],"abstract_inverted_index":{"ARM-based":[0],"CPU":[1,127],"architectures":[2,128],"are":[3,99,158],"currently":[4],"driving":[5],"massive":[6],"disruptions":[7],"in":[8,25,30,41,70,102],"the":[9,17,31,57,85,89,125,131,137,148,185],"High":[10],"Performance":[11],"Computing":[12],"(HPC)":[13],"community.":[14],"Deployment":[15],"of":[16,51,59,84,187],"48-core":[18],"Fujitsu":[19,52],"A64FX":[20,53],"ARM":[21,43,126],"architecture":[22],"based":[23],"processor":[24],"RIKEN":[26],"\u201cFugaku\u201d":[27],"supercomputer":[28],"(#2":[29],"June":[32],"2023":[33],"Top500":[34],"list)":[35],"was":[36],"a":[37,67,114,118,141],"major":[38],"inflection":[39],"point":[40],"pushing":[42],"to":[44,55,65,75,87,161,173],"mainstream":[45],"HPC.":[46],"A":[47],"key":[48],"design":[49],"criteria":[50],"is":[54,145,171],"enhance":[56,88],"throughput":[58,90],"modern":[60],"memory-bound":[61],"applications,":[62],"which":[63,98,144],"happens":[64],"be":[66,152],"dominant":[68],"pattern":[69],"contemporary":[71],"HPC,":[72],"as":[73,180],"opposed":[74],"traditional":[76],"compute-bound":[77],"or":[78],"floating-point":[79],"intensive":[80],"science":[81,103],"workloads.":[82],"One":[83],"mechanisms":[86],"concerns":[91],"write-allocate":[92,108,188],"operations":[93,109],"(e.g.,":[94],"streaming":[95],"write":[96,115],"operations),":[97],"quite":[100],"common":[101],"applications.":[104,193],"In":[105],"particular,":[106],"eliminating":[107],"(allocate":[110],"cache":[111,142,149],"line":[112,150],"on":[113,124,190],"miss)":[116],"through":[117],"special":[119],"\u201czero":[120],"fill\u201d":[121],"instruction":[122],"available":[123],"can":[129],"improve":[130],"overall":[132],"memory":[133,138,168],"bandwidth,":[134],"by":[135],"avoiding":[136],"read":[139],"into":[140],"line,":[143],"unnecessary":[146],"since":[147],"will":[151],"written":[153],"consequently.":[154],"While":[155],"bandwidth":[156],"implications":[157],"relatively":[159],"straightforward":[160],"measure":[162],"via":[163],"synthetic":[164],"benchmarks":[165],"with":[166],"fixed-stride":[167],"accesses,":[169],"it":[170],"important":[172],"consider":[174],"irregular":[175],"memory-access":[176],"driven":[177],"scenarios":[178],"such":[179],"graph":[181],"analytics,":[182],"and":[183],"analyze":[184],"impact":[186],"elimination":[189],"diverse":[191],"data-driven":[192]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
