{"id":"https://openalex.org/W3158454049","doi":"https://doi.org/10.1109/coolchips52128.2021.9410320","title":"Power/Performance/Area Evaluations for Next-Generation HPC Processors using the A64FX Chip","display_name":"Power/Performance/Area Evaluations for Next-Generation HPC Processors using the A64FX Chip","publication_year":2021,"publication_date":"2021-04-14","ids":{"openalex":"https://openalex.org/W3158454049","doi":"https://doi.org/10.1109/coolchips52128.2021.9410320","mag":"3158454049"},"language":"en","primary_location":{"id":"doi:10.1109/coolchips52128.2021.9410320","is_oa":false,"landing_page_url":"https://doi.org/10.1109/coolchips52128.2021.9410320","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Symposium in Low-Power and High-Speed Chips (COOL CHIPS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087319091","display_name":"Eishi Arima","orcid":"https://orcid.org/0009-0002-7043-4288"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Eishi Arima","raw_affiliation_strings":["The University of Tokyo, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102814672","display_name":"Yuetsu Kodama","orcid":"https://orcid.org/0000-0001-5787-0363"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuetsu Kodama","raw_affiliation_strings":["RIKEN Center for Computational Science, Kobe, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science, Kobe, Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085261318","display_name":"Tetsuya Odajima","orcid":null},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tetsuya Odajima","raw_affiliation_strings":["RIKEN Center for Computational Science, Kobe, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science, Kobe, Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079973660","display_name":"Miwako Tsuji","orcid":"https://orcid.org/0000-0003-4709-1969"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Miwako Tsuji","raw_affiliation_strings":["RIKEN Center for Computational Science, Kobe, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science, Kobe, Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040254066","display_name":"Mitsuhisa Sato","orcid":"https://orcid.org/0000-0003-0543-7116"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Mitsuhisa Sato","raw_affiliation_strings":["RIKEN Center for Computational Science, Kobe, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science, Kobe, Japan","institution_ids":["https://openalex.org/I4210129730"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.3036,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.92189893,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.8772079944610596},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8349317312240601},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7789918184280396},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.762792706489563},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5686349868774414},{"id":"https://openalex.org/keywords/flops","display_name":"FLOPS","score":0.5641805529594421},{"id":"https://openalex.org/keywords/microprocessor","display_name":"Microprocessor","score":0.5306944847106934},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.5129146575927734},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.4773269295692444},{"id":"https://openalex.org/keywords/chip","display_name":"Chip","score":0.45364734530448914},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.4498632252216339},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.44491615891456604},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4325808882713318},{"id":"https://openalex.org/keywords/system-on-a-chip","display_name":"System on a chip","score":0.42532992362976074},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.12124711275100708},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08669230341911316}],"concepts":[{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.8772079944610596},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8349317312240601},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7789918184280396},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.762792706489563},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5686349868774414},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.5641805529594421},{"id":"https://openalex.org/C2780728072","wikidata":"https://www.wikidata.org/wiki/Q5297","display_name":"Microprocessor","level":2,"score":0.5306944847106934},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.5129146575927734},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.4773269295692444},{"id":"https://openalex.org/C165005293","wikidata":"https://www.wikidata.org/wiki/Q1074500","display_name":"Chip","level":2,"score":0.45364734530448914},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.4498632252216339},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.44491615891456604},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4325808882713318},{"id":"https://openalex.org/C118021083","wikidata":"https://www.wikidata.org/wiki/Q610398","display_name":"System on a chip","level":2,"score":0.42532992362976074},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.12124711275100708},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08669230341911316},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/coolchips52128.2021.9410320","is_oa":false,"landing_page_url":"https://doi.org/10.1109/coolchips52128.2021.9410320","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Symposium in Low-Power and High-Speed Chips (COOL CHIPS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.8100000023841858}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320912","display_name":"Ministry of Education, Culture, Sports, Science and Technology","ror":"https://ror.org/048rj2z13"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W83535271","https://openalex.org/W1976494130","https://openalex.org/W2026981025","https://openalex.org/W2076652033","https://openalex.org/W2106562406","https://openalex.org/W2147657366","https://openalex.org/W2157070686","https://openalex.org/W2170382128","https://openalex.org/W2201475267","https://openalex.org/W2325538041","https://openalex.org/W2561995440","https://openalex.org/W2735029112","https://openalex.org/W2758250355","https://openalex.org/W2900387938","https://openalex.org/W2996519492","https://openalex.org/W3037152957","https://openalex.org/W3091948764","https://openalex.org/W3101195351","https://openalex.org/W3128486141","https://openalex.org/W3132840842","https://openalex.org/W4234059337","https://openalex.org/W4249553981","https://openalex.org/W6687496080","https://openalex.org/W6730455766","https://openalex.org/W6790072633","https://openalex.org/W6790589905"],"related_works":["https://openalex.org/W1979781211","https://openalex.org/W2038328339","https://openalex.org/W401777774","https://openalex.org/W2148790774","https://openalex.org/W1964549096","https://openalex.org/W56807374","https://openalex.org/W583741936","https://openalex.org/W3158454049","https://openalex.org/W2364447129","https://openalex.org/W1487278226"],"abstract_inverted_index":{"Future":[0],"HPC":[1,167],"systems,":[2],"including":[3],"post-exascale":[4],"supercomputers,":[5],"will":[6,136],"face":[7],"severe":[8],"problems":[9],"such":[10],"as":[11],"the":[12,18,33,46,55,73,83,88,95,105,113,143,158,162],"slowing-down":[13],"of":[14,20,49,62,115,165],"Moore's":[15],"law":[16],"and":[17,58,67,85,90,119,152],"limitation":[19],"power":[21,89],"supply.":[22],"To":[23],"achieve":[24],"desired":[25],"system":[26,145],"performance":[27],"improvement":[28,108],"while":[29],"counteracting":[30],"these":[31],"issues,":[32],"hardware":[34],"design":[35],"optimization":[36],"is":[37],"a":[38,59],"key":[39],"factor.":[40],"In":[41],"this":[42],"paper,":[43],"we":[44,76,102,160],"investigate":[45,103],"future":[47,163],"directions":[48,164],"SIMD-based":[50,166],"processor":[51],"architectures":[52],"by":[53,93,111],"using":[54],"A64FX":[56,74],"chip":[57],"customized":[60],"version":[61],"power/performance/area":[63],"simulators,":[64,84],"i.e.,":[65],"Gem5":[66],"McPAT.":[68],"More":[69],"specifically,":[70],"based":[71],"on":[72,148,157],"chip,":[75],"firstly":[77],"customize":[78],"various":[79],"energy":[80],"parameters":[81],"in":[82],"then":[86],"evaluate":[87],"area":[91],"reductions":[92],"scaling":[94,112,135],"technology":[96],"node":[97],"down":[98],"to":[99,142],"3nm.":[100],"Moreover,":[101],"also":[104],"achievable":[106],"FLOPS":[107,140],"at":[109],"3nm":[110],"number":[114],"cores,":[116],"SIMD":[117],"width,":[118],"FP":[120,153],"pipeline":[121],"width":[122,134],"under":[123],"power/area":[124],"constraints.":[125],"The":[126],"evaluation":[127],"result":[128],"indicates":[129],"that":[130],"no":[131],"further":[132],"SIMD/pipeline":[133],"help":[137],"with":[138],"improving":[139],"due":[141],"memory":[144],"bottleneck,":[146],"especially":[147],"L1":[149],"data":[150],"caches":[151],"register":[154],"files.":[155],"Based":[156],"observation,":[159],"discuss":[161],"processors.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
