{"id":"https://openalex.org/W3005380678","doi":"https://doi.org/10.1007/978-3-030-50743-5_21","title":"Understanding HPC Benchmark Performance on Intel Broadwell and\u00a0Cascade Lake Processors","display_name":"Understanding HPC Benchmark Performance on Intel Broadwell and\u00a0Cascade Lake Processors","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3005380678","doi":"https://doi.org/10.1007/978-3-030-50743-5_21","mag":"3005380678"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-030-50743-5_21","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-50743-5_21","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-50743-5_21.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-50743-5_21.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058357790","display_name":"Christie Louis Alappat","orcid":"https://orcid.org/0000-0003-4548-8727"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Christie L. Alappat","raw_affiliation_strings":["Erlangen Regional Computing Center (RRZE), 91058, Erlangen, Germany"],"affiliations":[{"raw_affiliation_string":"Erlangen Regional Computing Center (RRZE), 91058, Erlangen, Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058862418","display_name":"Johannes Hofmann","orcid":"https://orcid.org/0000-0002-0667-2452"},"institutions":[{"id":"https://openalex.org/I181369854","display_name":"Friedrich-Alexander-Universit\u00e4t Erlangen-N\u00fcrnberg","ror":"https://ror.org/00f7hpc57","country_code":"DE","type":"education","lineage":["https://openalex.org/I181369854"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Johannes Hofmann","raw_affiliation_strings":["Department of Computer Science, University of Erlangen-Nuremberg, 91058, Erlangen, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Erlangen-Nuremberg, 91058, Erlangen, Germany","institution_ids":["https://openalex.org/I181369854"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082552227","display_name":"Georg Hager","orcid":"https://orcid.org/0000-0002-8723-2781"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Georg Hager","raw_affiliation_strings":["Erlangen Regional Computing Center (RRZE), 91058, Erlangen, Germany"],"affiliations":[{"raw_affiliation_string":"Erlangen Regional Computing Center (RRZE), 91058, Erlangen, Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108081461","display_name":"Holger Fehske","orcid":"https://orcid.org/0000-0003-2146-8203"},"institutions":[{"id":"https://openalex.org/I36522303","display_name":"Universit\u00e4t Greifswald","ror":"https://ror.org/00r1edq15","country_code":"DE","type":"education","lineage":["https://openalex.org/I36522303"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Holger Fehske","raw_affiliation_strings":["Institute of Physics, University of Greifswald, 17489, Greifswald, Germany"],"affiliations":[{"raw_affiliation_string":"Institute of Physics, University of Greifswald, 17489, Greifswald, Germany","institution_ids":["https://openalex.org/I36522303"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113506287","display_name":"A. R. Bishop","orcid":"https://orcid.org/0009-0002-4781-387X"},"institutions":[{"id":"https://openalex.org/I1343871089","display_name":"Los Alamos National Laboratory","ror":"https://ror.org/01e41cf67","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I1343871089","https://openalex.org/I198811213","https://openalex.org/I4210120050"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alan R. Bishop","raw_affiliation_strings":["Science, Technology and Engineering Directorate, Los Alamos National Laboratory, Los Alamos, USA"],"affiliations":[{"raw_affiliation_string":"Science, Technology and Engineering Directorate, Los Alamos National Laboratory, Los Alamos, USA","institution_ids":["https://openalex.org/I1343871089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070209050","display_name":"Gerhard Wellein","orcid":"https://orcid.org/0000-0001-7371-3026"},"institutions":[{"id":"https://openalex.org/I181369854","display_name":"Friedrich-Alexander-Universit\u00e4t Erlangen-N\u00fcrnberg","ror":"https://ror.org/00f7hpc57","country_code":"DE","type":"education","lineage":["https://openalex.org/I181369854"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gerhard Wellein","raw_affiliation_strings":["Department of Computer Science, University of Erlangen-Nuremberg, 91058, Erlangen, Germany","Erlangen Regional Computing Center (RRZE), 91058, Erlangen, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Erlangen-Nuremberg, 91058, Erlangen, Germany","institution_ids":["https://openalex.org/I181369854"]},{"raw_affiliation_string":"Erlangen Regional Computing Center (RRZE), 91058, Erlangen, Germany","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5058357790"],"corresponding_institution_ids":[],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":{"value":5000,"currency":"EUR","value_usd":5392},"fwci":11.433,"has_fulltext":true,"cited_by_count":22,"citation_normalized_percentile":{"value":0.9900722,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"412","last_page":"433"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10363","display_name":"Low-power high-performance VLSI design","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8908033967018127},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.804814338684082},{"id":"https://openalex.org/keywords/x86","display_name":"x86","score":0.7379047274589539},{"id":"https://openalex.org/keywords/cascade","display_name":"Cascade","score":0.6089204549789429},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5712551474571228},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4971354305744171},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.47280898690223694},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.46113574504852295},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4577428996562958},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.44806140661239624},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.425694078207016},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.41994109749794006},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.29808056354522705},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07342016696929932}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8908033967018127},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.804814338684082},{"id":"https://openalex.org/C170723468","wikidata":"https://www.wikidata.org/wiki/Q182933","display_name":"x86","level":3,"score":0.7379047274589539},{"id":"https://openalex.org/C34146451","wikidata":"https://www.wikidata.org/wiki/Q5048094","display_name":"Cascade","level":2,"score":0.6089204549789429},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5712551474571228},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4971354305744171},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.47280898690223694},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.46113574504852295},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4577428996562958},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.44806140661239624},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.425694078207016},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.41994109749794006},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.29808056354522705},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07342016696929932},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1007/978-3-030-50743-5_21","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-50743-5_21","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-50743-5_21.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:arXiv.org:2002.03344","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.03344","pdf_url":"https://arxiv.org/pdf/2002.03344","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:eref.uni-bayreuth.de:66748","is_oa":true,"landing_page_url":null,"pdf_url":"https://arxiv.org/abs/2002.03344","source":{"id":"https://openalex.org/S4377196442","display_name":"ERef Bayreuth (University of Bayreuth)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I54009628","host_organization_name":"University of Bayreuth","host_organization_lineage":["https://openalex.org/I54009628"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Artikel in einer Zeitschrift"},{"id":"pmh:oai:pubmedcentral.nih.gov:7295341","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/7295341","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"High Performance Computing","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1007/978-3-030-50743-5_21","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-50743-5_21","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-030-50743-5_21.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"sustainable_development_goals":[{"score":0.6600000262260437,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G2157692340","display_name":"Verbundprojekt: SeASiTe - Selbstadaption f\u00fcr zeitschrittbasierte Simulationstechniken auf heterogenen HPC-Systemen","funder_award_id":"01IH16012C","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G352791218","display_name":null,"funder_award_id":"(BMBF)","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G7225624288","display_name":null,"funder_award_id":"This work was","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3005380678.pdf","grobid_xml":"https://content.openalex.org/works/W3005380678.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W35088483","https://openalex.org/W858404628","https://openalex.org/W2025564310","https://openalex.org/W2035080386","https://openalex.org/W2058022120","https://openalex.org/W2105321788","https://openalex.org/W2124350608","https://openalex.org/W2150319905","https://openalex.org/W2211971732","https://openalex.org/W2257508639","https://openalex.org/W2486056921","https://openalex.org/W2582675761","https://openalex.org/W2593836394","https://openalex.org/W2791494644","https://openalex.org/W2795096332","https://openalex.org/W2899324948","https://openalex.org/W2913716454","https://openalex.org/W2957142384","https://openalex.org/W2962978274","https://openalex.org/W3037519583","https://openalex.org/W3086476857","https://openalex.org/W3100119968","https://openalex.org/W3102705131","https://openalex.org/W3122375428"],"related_works":["https://openalex.org/W2153719181","https://openalex.org/W2384867379","https://openalex.org/W1971748923","https://openalex.org/W3215381467","https://openalex.org/W4301207796","https://openalex.org/W1566155057","https://openalex.org/W1980322368","https://openalex.org/W2096357811","https://openalex.org/W2072005592","https://openalex.org/W2119413962"],"abstract_inverted_index":{"Abstract":[0],"Hardware":[1],"platforms":[2],"in":[3,25,116],"high":[4],"performance":[5,36,85,100,138],"computing":[6],"are":[7,33,37,71],"constantly":[8],"getting":[9],"more":[10],"complex":[11],"to":[12,41,61,96,142,178,182],"handle":[13],"even":[14,39],"when":[15],"considering":[16],"multicore":[17],"CPUs":[18],"alone.":[19],"Numerous":[20],"features":[21],"and":[22,28,74,120,139,146,159,174],"configuration":[23,128],"options":[24],"the":[26,29,57,76,175],"hardware":[27,127],"software":[30],"environment":[31],"that":[32,51,130],"relevant":[34,126,183],"for":[35,99],"not":[38],"known":[40,82],"most":[42],"application":[43,184],"users":[44],"or":[45,84,102],"developers.":[46],"Microbenchmarks,":[47],"i.e.,":[48],"simple":[49],"codes":[50],"fathom":[52],"a":[53,133,180],"particular":[54],"aspect":[55],"of":[56,156],"hardware,":[58],"can":[59,78,131],"help":[60],"shed":[62],"light":[63],"on":[64,136],"such":[65],"issues,":[66],"but":[67],"only":[68],"if":[69,75],"they":[70],"well":[72],"understood":[73],"results":[77],"be":[79,94],"reconciled":[80],"with":[81],"facts":[83],"models.":[86],"The":[87,151],"insight":[88],"gained":[89],"from":[90],"microbenchmarks":[91],"may":[92],"then":[93],"applied":[95],"real":[97],"applications":[98],"analysis":[101],"optimization.":[103],"In":[104],"this":[105],"paper":[106],"we":[107,168],"investigate":[108],"two":[109],"modern":[110],"Intel":[111],"x86":[112],"server":[113],"CPU":[114],"architectures":[115],"depth:":[117],"Broadwell":[118],"EP":[119],"Cascade":[121,157],"Lake":[122,158],"SP.":[123],"We":[124],"highlight":[125],"settings":[129],"have":[132],"decisive":[134],"impact":[135],"code":[137],"show":[140],"how":[141],"properly":[143],"measure":[144],"on-chip":[145],"off-chip":[147],"data":[148],"transfer":[149],"bandwidths.":[150],"new":[152],"victim":[153],"L3":[154],"cache":[155],"its":[160],"advanced":[161],"replacement":[162],"policy":[163],"receive":[164],"due":[165],"attention.":[166],"Finally":[167],"use":[169],"DGEMM,":[170],"sparse":[171],"matrix-vector":[172],"multiplication,":[173],"HPCG":[176],"benchmark":[177],"make":[179],"connection":[181],"scenarios.":[185]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":4}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2020-02-14T00:00:00"}
