{"id":"https://openalex.org/W2963896930","doi":"https://doi.org/10.3233/978-1-61499-843-3-47","title":"Porting of the DBCSR Library for Sparse Matrix-Matrix Multiplications to Intel Xeon Phi Systems","display_name":"Porting of the DBCSR Library for Sparse Matrix-Matrix Multiplications to Intel Xeon Phi Systems","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2963896930","doi":"https://doi.org/10.3233/978-1-61499-843-3-47","mag":"2963896930"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-61499-843-3-47","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-843-3-47","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028832623","display_name":"Iain Bethune","orcid":"https://orcid.org/0000-0003-0713-2084"},"institutions":[{"id":"https://openalex.org/I2802015276","display_name":"Daresbury Laboratory","ror":"https://ror.org/0089bg420","country_code":"GB","type":"facility","lineage":["https://openalex.org/I162524378","https://openalex.org/I2802015276","https://openalex.org/I4210087105"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Bethune Iain","raw_affiliation_strings":["Daresbury Laboratory, Daresbury, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Daresbury Laboratory, Daresbury, United Kingdom","institution_ids":["https://openalex.org/I2802015276"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051171407","display_name":"Andreas Gl\u00f6\u00df","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gl&ouml;ss Andreas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045830246","display_name":"J\u00fcrg Hutter","orcid":"https://orcid.org/0000-0002-6887-8229"},"institutions":[{"id":"https://openalex.org/I202697423","display_name":"University of Zurich","ror":"https://ror.org/02crff812","country_code":"CH","type":"education","lineage":["https://openalex.org/I202697423"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Hutter J&uuml;rg","raw_affiliation_strings":["University of Zurich, Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"University of Zurich, Zurich, Switzerland","institution_ids":["https://openalex.org/I202697423"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101815936","display_name":"Alfio Lazzaro","orcid":"https://orcid.org/0000-0003-4256-8270"},"institutions":[{"id":"https://openalex.org/I189158943","display_name":"University of Milan","ror":"https://ror.org/00wjc7c48","country_code":"IT","type":"education","lineage":["https://openalex.org/I189158943"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Lazzaro Alfio","raw_affiliation_strings":["University of Milan, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"University of Milan, Milan, Italy","institution_ids":["https://openalex.org/I189158943"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072681045","display_name":"Hans Pabst","orcid":null},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pabst Hans","raw_affiliation_strings":["Intel (United States), Santa Clara, United States"],"affiliations":[{"raw_affiliation_string":"Intel (United States), Santa Clara, United States","institution_ids":["https://openalex.org/I1343180700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103385886","display_name":"Fiona Reid","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Reid Fiona","raw_affiliation_strings":["University of Edinburgh, Edinburgh, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh, Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5028832623"],"corresponding_institution_ids":["https://openalex.org/I2802015276"],"apc_list":null,"apc_paid":null,"fwci":1.2773,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.81506849,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.8922603726387024},{"id":"https://openalex.org/keywords/porting","display_name":"Porting","score":0.8392101526260376},{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.7844548225402832},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6836358904838562},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6787700057029724},{"id":"https://openalex.org/keywords/linear-algebra","display_name":"Linear algebra","score":0.5643948316574097},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.5437487363815308},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.5072593092918396},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.47718942165374756},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.46137556433677673},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.44221773743629456},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.39128896594047546},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.171941339969635},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0981922447681427},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.0950126051902771},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.08750161528587341},{"id":"https://openalex.org/keywords/computational-chemistry","display_name":"Computational chemistry","score":0.06691133975982666},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.05870512127876282},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.05824202299118042}],"concepts":[{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.8922603726387024},{"id":"https://openalex.org/C106251023","wikidata":"https://www.wikidata.org/wiki/Q851989","display_name":"Porting","level":3,"score":0.8392101526260376},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.7844548225402832},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6836358904838562},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6787700057029724},{"id":"https://openalex.org/C139352143","wikidata":"https://www.wikidata.org/wiki/Q82571","display_name":"Linear algebra","level":2,"score":0.5643948316574097},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.5437487363815308},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.5072593092918396},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.47718942165374756},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.46137556433677673},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.44221773743629456},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.39128896594047546},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.171941339969635},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0981922447681427},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0950126051902771},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.08750161528587341},{"id":"https://openalex.org/C147597530","wikidata":"https://www.wikidata.org/wiki/Q369472","display_name":"Computational chemistry","level":1,"score":0.06691133975982666},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.05870512127876282},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.05824202299118042},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/978-1-61499-843-3-47","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-843-3-47","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2147910609","https://openalex.org/W2609613932","https://openalex.org/W2008373862","https://openalex.org/W2475524688","https://openalex.org/W2739740241","https://openalex.org/W2085105049","https://openalex.org/W2592417500","https://openalex.org/W1974923383","https://openalex.org/W2331803692","https://openalex.org/W2466690044"],"abstract_inverted_index":{"Multiplication":[0],"of":[1,12,16,20,82,89],"two":[2],"sparse":[3,27,45],"matrices":[4],"is":[5,50,69],"a":[6,86],"key":[7],"operation":[8],"in":[9,66],"the":[10,13,51],"simulation":[11],"electronic":[14,58],"structure":[15,59],"systems":[17,92,104,110],"containing":[18],"thousands":[19],"atoms":[21],"and":[22,61,73,75],"electrons.":[23],"The":[24],"highly":[25],"optimized":[26],"linear":[28,56],"algebra":[29],"library":[30,49],"DBCSR":[31,90],"(Distributed":[32],"Block":[33],"Compressed":[34],"Sparse":[35],"Row)":[36],"has":[37],"been":[38],"specifically":[39],"designed":[40],"to":[41,103],"efficiently":[42],"perform":[43],"such":[44],"matrix-matrix":[46],"multiplications.":[47],"This":[48],"basic":[52],"building":[53],"block":[54],"for":[55],"scaling":[57,63],"theory":[60],"low":[62],"correlated":[64],"methods":[65],"CP2K.":[67],"It":[68],"parallelized":[70],"using":[71],"MPI":[72],"OpenMP,":[74],"can":[76],"exploit":[77],"GPU":[78],"accelerators":[79],"by":[80],"means":[81],"CUDA.":[83],"We":[84],"describe":[85],"performance":[87],"comparison":[88],"on":[91],"with":[93,101,105,111],"Intel":[94,106],"Xeon":[95,107],"Phi":[96],"Knights":[97],"Landing":[98],"(KNL)":[99],"processors,":[100],"respect":[102],"CPUs":[108],"(including":[109],"GPUs).":[112]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
