{"id":"https://openalex.org/W3085986100","doi":"https://doi.org/10.1109/hpcs48598.2019.9188103","title":"Open-Source Shared Memory implementation of the HPCG benchmark: analysis, improvements and evaluation on Cavium ThunderX2","display_name":"Open-Source Shared Memory implementation of the HPCG benchmark: analysis, improvements and evaluation on Cavium ThunderX2","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W3085986100","doi":"https://doi.org/10.1109/hpcs48598.2019.9188103","mag":"3085986100"},"language":"en","primary_location":{"id":"doi:10.1109/hpcs48598.2019.9188103","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpcs48598.2019.9188103","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Conference on High Performance Computing &amp; Simulation (HPCS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5106497787","display_name":"Daniel Ruiz","orcid":"https://orcid.org/0000-0002-3867-0179"},"institutions":[{"id":"https://openalex.org/I2801109035","display_name":"ARM (United Kingdom)","ror":"https://ror.org/04mmhzs81","country_code":"GB","type":"company","lineage":["https://openalex.org/I2801109035"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Daniel Ruiz","raw_affiliation_strings":["Arm Ltd., Cambridge, UK"],"affiliations":[{"raw_affiliation_string":"Arm Ltd., Cambridge, UK","institution_ids":["https://openalex.org/I2801109035"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070653336","display_name":"Filippo Spiga","orcid":"https://orcid.org/0000-0003-1448-5304"},"institutions":[{"id":"https://openalex.org/I2801109035","display_name":"ARM (United Kingdom)","ror":"https://ror.org/04mmhzs81","country_code":"GB","type":"company","lineage":["https://openalex.org/I2801109035"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Filippo Spiga","raw_affiliation_strings":["Arm Ltd., Cambridge, UK"],"affiliations":[{"raw_affiliation_string":"Arm Ltd., Cambridge, UK","institution_ids":["https://openalex.org/I2801109035"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044183257","display_name":"Marc Casas","orcid":"https://orcid.org/0000-0003-4564-2093"},"institutions":[{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]},{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Marc Casas","raw_affiliation_strings":["BSC-CNS, Barcelona, Spain"],"affiliations":[{"raw_affiliation_string":"BSC-CNS, Barcelona, Spain","institution_ids":["https://openalex.org/I9617848","https://openalex.org/I2799803557"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082933794","display_name":"Marta Garc\u00eda-Gasulla","orcid":"https://orcid.org/0000-0003-3682-9905"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]},{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Marta Garcia-Gasulla","raw_affiliation_strings":["BSC-CNS, Barcelona, Spain"],"affiliations":[{"raw_affiliation_string":"BSC-CNS, Barcelona, Spain","institution_ids":["https://openalex.org/I9617848","https://openalex.org/I2799803557"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046459017","display_name":"Filippo Mantovani","orcid":"https://orcid.org/0000-0003-3559-4825"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]},{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Filippo Mantovani","raw_affiliation_strings":["BSC-CNS, Barcelona, Spain"],"affiliations":[{"raw_affiliation_string":"BSC-CNS, Barcelona, Spain","institution_ids":["https://openalex.org/I9617848","https://openalex.org/I2799803557"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5106497787"],"corresponding_institution_ids":["https://openalex.org/I2801109035"],"apc_list":null,"apc_paid":null,"fwci":0.9631,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.75723976,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"312","issue":null,"first_page":"225","last_page":"232"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10339","display_name":"Advanced Numerical Methods in Computational Mathematics","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7849660515785217},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7433410882949829},{"id":"https://openalex.org/keywords/open-source","display_name":"Open source","score":0.5465167164802551},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4284132122993469},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.38990628719329834},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2773066759109497},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.13206464052200317}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7849660515785217},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7433410882949829},{"id":"https://openalex.org/C3018397939","wikidata":"https://www.wikidata.org/wiki/Q3644502","display_name":"Open source","level":3,"score":0.5465167164802551},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4284132122993469},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.38990628719329834},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2773066759109497},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.13206464052200317},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpcs48598.2019.9188103","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpcs48598.2019.9188103","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Conference on High Performance Computing &amp; Simulation (HPCS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.47999998927116394,"display_name":"Life in Land","id":"https://metadata.un.org/sdg/15"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W59438603","https://openalex.org/W105754624","https://openalex.org/W309890564","https://openalex.org/W821177523","https://openalex.org/W858404628","https://openalex.org/W1252105715","https://openalex.org/W1495954130","https://openalex.org/W1506342804","https://openalex.org/W1656664476","https://openalex.org/W1962931680","https://openalex.org/W2009196736","https://openalex.org/W2100725958","https://openalex.org/W2111784516","https://openalex.org/W2318393100","https://openalex.org/W2530848289","https://openalex.org/W2566272869","https://openalex.org/W2587647010","https://openalex.org/W2613264175","https://openalex.org/W2623993198","https://openalex.org/W2750064372","https://openalex.org/W2753129172","https://openalex.org/W2759197764","https://openalex.org/W2799373657","https://openalex.org/W2913716454","https://openalex.org/W3123542955","https://openalex.org/W4302771278","https://openalex.org/W6623297523","https://openalex.org/W6623627250","https://openalex.org/W6629678226","https://openalex.org/W6652573353","https://openalex.org/W6731443796"],"related_works":["https://openalex.org/W1485630101","https://openalex.org/W2498017833","https://openalex.org/W1604898313","https://openalex.org/W2010011028","https://openalex.org/W2081245617","https://openalex.org/W2391655055","https://openalex.org/W3088526462","https://openalex.org/W1997145140","https://openalex.org/W2034384303","https://openalex.org/W4310292586"],"abstract_inverted_index":{"The":[0],"High":[1,18],"Performance":[2,19],"Conjugate":[3],"Gradient":[4],"(HPCG)":[5],"benchmark":[6,10,40,72],"complements":[7],"the":[8,12,57,66,70,93,98,136,142,146],"LINPACK":[9],"in":[11,80,107],"performance":[13],"evaluation":[14],"coverage":[15],"of":[16,65,69,101,145,162],"large":[17],"Computing":[20],"(HPC)":[21],"systems.":[22],"Due":[23,96],"to":[24,97,135,156],"its":[25,50],"lower":[26],"arithmetic":[27],"intensity":[28],"and":[29,43,85,104],"higher":[30],"memory":[31,45,77],"pressure,":[32],"HPCG":[33,71,113,148],"is":[34,73],"recognized":[35],"as":[36,129],"a":[37,62,116,130],"more":[38],"representative":[39],"for":[41,92],"data-center":[42],"irregular":[44],"access":[46],"pattern":[47],"workloads,":[48],"therefore":[49],"popularity":[51],"has":[52,149],"been":[53,150],"steadily":[54],"raising":[55],"within":[56],"HPC":[58,118,164],"community.":[59,165],"As":[60],"only":[61],"small":[63],"fraction":[64],"reference":[67],"version":[68,114],"parallelized":[74],"with":[75,139],"shared":[76],"techniques":[78],"(OpenMP),":[79],"this":[81,140],"paper":[82],"we":[83,109],"introduce":[84],"evaluate":[86,110],"in-depth":[87],"two":[88],"OpenMP":[89],"parallelization":[90],"strategies":[91],"Gauss-Seidel":[94],"preconditioner.":[95],"increasing":[99],"attractiveness":[100],"Arm":[102,105],"architecture":[103],"ecosystem":[106],"HPC,":[108],"our":[111,127],"modified":[112,147],"on":[115,121,154],"state-of-the-art":[117],"system":[119],"based":[120],"Cavium":[122],"ThunderX2":[123],"SoC.":[124],"We":[125],"consider":[126],"work":[128],"broader":[131],"contribution":[132],"not":[133],"exclusively":[134],"Arm:":[137],"along":[138],"paper,":[141],"source":[143],"code":[144],"made":[151],"publicly":[152],"available":[153],"GitLab":[155],"enable":[157],"further":[158],"optimizations":[159],"at":[160],"benefit":[161],"all":[163]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
