{"id":"https://openalex.org/W2893158683","doi":"https://doi.org/10.1002/cpe.4964","title":"Optimized all\u2010to\u2010all communication on multicore architectures applied to FFTs with pencil decomposition","display_name":"Optimized all\u2010to\u2010all communication on multicore architectures applied to FFTs with pencil decomposition","publication_year":2018,"publication_date":"2018-09-27","ids":{"openalex":"https://openalex.org/W2893158683","doi":"https://doi.org/10.1002/cpe.4964","mag":"2893158683"},"language":"en","primary_location":{"id":"doi:10.1002/cpe.4964","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.4964","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047832410","display_name":"A. Jocksch","orcid":"https://orcid.org/0000-0002-3327-4230"},"institutions":[{"id":"https://openalex.org/I59105498","display_name":"Swisscom (Switzerland)","ror":"https://ror.org/04t1f4f50","country_code":"CH","type":"company","lineage":["https://openalex.org/I59105498"]},{"id":"https://openalex.org/I4391767926","display_name":"CSCS - Swiss National Supercomputing Centre","ror":"https://ror.org/04rzmms09","country_code":null,"type":"facility","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088","https://openalex.org/I4391767926"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Andreas Jocksch","raw_affiliation_strings":["CSCS Swiss National Supercomputing Centre  Lugano Switzerland","CSCS, Swiss National Supercomputing Centre, Lugano, Switzerland","Andreas Jocksch, CSCS, Swiss National Supercomputing Centre, Via Trevano 131, 6900 Lugano, Switzerland"],"affiliations":[{"raw_affiliation_string":"CSCS Swiss National Supercomputing Centre  Lugano Switzerland","institution_ids":["https://openalex.org/I59105498"]},{"raw_affiliation_string":"CSCS, Swiss National Supercomputing Centre, Lugano, Switzerland","institution_ids":["https://openalex.org/I59105498","https://openalex.org/I4391767926"]},{"raw_affiliation_string":"Andreas Jocksch, CSCS, Swiss National Supercomputing Centre, Via Trevano 131, 6900 Lugano, Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084981761","display_name":"Matthias Kraushaar","orcid":null},"institutions":[{"id":"https://openalex.org/I59105498","display_name":"Swisscom (Switzerland)","ror":"https://ror.org/04t1f4f50","country_code":"CH","type":"company","lineage":["https://openalex.org/I59105498"]},{"id":"https://openalex.org/I4391767926","display_name":"CSCS - Swiss National Supercomputing Centre","ror":"https://ror.org/04rzmms09","country_code":null,"type":"facility","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088","https://openalex.org/I4391767926"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Matthias Kraushaar","raw_affiliation_strings":["CSCS Swiss National Supercomputing Centre  Lugano Switzerland","CSCS, Swiss National Supercomputing Centre, Lugano, Switzerland"],"affiliations":[{"raw_affiliation_string":"CSCS Swiss National Supercomputing Centre  Lugano Switzerland","institution_ids":["https://openalex.org/I59105498"]},{"raw_affiliation_string":"CSCS, Swiss National Supercomputing Centre, Lugano, Switzerland","institution_ids":["https://openalex.org/I59105498","https://openalex.org/I4391767926"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015096033","display_name":"David Daverio","orcid":"https://orcid.org/0000-0002-4693-4891"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I3019243323","display_name":"Center for Theoretical Physics","ror":"https://ror.org/04kfyt897","country_code":"PL","type":"facility","lineage":["https://openalex.org/I3019243323","https://openalex.org/I99542240"]}],"countries":["GB","PL"],"is_corresponding":false,"raw_author_name":"David Daverio","raw_affiliation_strings":["Centre for Theoretical Cosmology, Department of Applied Mathematics and Theoretical Physics University of Cambridge  Cambridge United Kingdom","Centre for Theoretical Cosmology, Department of Applied Mathematics and Theoretical Physics, University of Cambridge, Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Centre for Theoretical Cosmology, Department of Applied Mathematics and Theoretical Physics University of Cambridge  Cambridge United Kingdom","institution_ids":["https://openalex.org/I241749","https://openalex.org/I3019243323"]},{"raw_affiliation_string":"Centre for Theoretical Cosmology, Department of Applied Mathematics and Theoretical Physics, University of Cambridge, Cambridge, United Kingdom","institution_ids":["https://openalex.org/I241749"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5047832410"],"corresponding_institution_ids":["https://openalex.org/I4391767926","https://openalex.org/I59105498"],"apc_list":{"value":4740,"currency":"USD","value_usd":4740},"apc_paid":null,"fwci":1.2623,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.78978245,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"31","issue":"16","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8691892623901367},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7229946255683899},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.6653999090194702},{"id":"https://openalex.org/keywords/message-passing-interface","display_name":"Message Passing Interface","score":0.592226505279541},{"id":"https://openalex.org/keywords/message-passing","display_name":"Message passing","score":0.5735281705856323},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5167067050933838},{"id":"https://openalex.org/keywords/shared-memory","display_name":"Shared memory","score":0.4910624027252197},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.4782753884792328},{"id":"https://openalex.org/keywords/distributed-memory","display_name":"Distributed memory","score":0.47786349058151245},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.4757159352302551},{"id":"https://openalex.org/keywords/pencil","display_name":"Pencil (optics)","score":0.44452428817749023},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.435346782207489},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.4174203872680664}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8691892623901367},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7229946255683899},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.6653999090194702},{"id":"https://openalex.org/C166782233","wikidata":"https://www.wikidata.org/wiki/Q127879","display_name":"Message Passing Interface","level":3,"score":0.592226505279541},{"id":"https://openalex.org/C854659","wikidata":"https://www.wikidata.org/wiki/Q1859284","display_name":"Message passing","level":2,"score":0.5735281705856323},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5167067050933838},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.4910624027252197},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.4782753884792328},{"id":"https://openalex.org/C91481028","wikidata":"https://www.wikidata.org/wiki/Q1054686","display_name":"Distributed memory","level":3,"score":0.47786349058151245},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.4757159352302551},{"id":"https://openalex.org/C134949993","wikidata":"https://www.wikidata.org/wiki/Q2068617","display_name":"Pencil (optics)","level":2,"score":0.44452428817749023},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.435346782207489},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.4174203872680664},{"id":"https://openalex.org/C157915830","wikidata":"https://www.wikidata.org/wiki/Q2928001","display_name":"Bubble","level":2,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C129307140","wikidata":"https://www.wikidata.org/wiki/Q6795880","display_name":"Maximum bubble pressure method","level":3,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1002/cpe.4964","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.4964","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320924","display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung","ror":"https://ror.org/00yjd3n13"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1814428676","https://openalex.org/W1880687005","https://openalex.org/W1968495897","https://openalex.org/W2043143850","https://openalex.org/W2056476515","https://openalex.org/W2070940137","https://openalex.org/W2078661244","https://openalex.org/W2097215900","https://openalex.org/W2102182691","https://openalex.org/W2131613942","https://openalex.org/W2133557963","https://openalex.org/W2139931691","https://openalex.org/W2141351738","https://openalex.org/W2164374391","https://openalex.org/W2766043324","https://openalex.org/W2787701215","https://openalex.org/W4250705075"],"related_works":["https://openalex.org/W2366325093","https://openalex.org/W1998761481","https://openalex.org/W2498758832","https://openalex.org/W184749201","https://openalex.org/W2154020360","https://openalex.org/W98999783","https://openalex.org/W1544002944","https://openalex.org/W2146236522","https://openalex.org/W2314805133","https://openalex.org/W2133825528"],"abstract_inverted_index":{"Summary":[0],"All\u2010to\u2010all":[1],"communication":[2,9,35],"is":[3,58],"a":[4,34],"basic":[5],"functionality":[6],"of":[7,55,68],"parallel":[8],"libraries":[10],"such":[11],"as":[12],"the":[13,39,69],"Message":[14],"Passing":[15],"Interface":[16],"(MPI).":[17],"Typically,":[18],"there":[19],"are":[20,26],"multiple":[21],"different":[22],"underlying":[23],"algorithms,":[24],"which":[25,37],"chosen":[27],"according":[28],"to":[29,74],"message":[30],"size.":[31],"We":[32],"propose":[33,65],"algorithm,":[36],"exploits":[38],"fact":[40],"that":[41],"modern":[42],"supercomputers":[43],"combine":[44],"shared":[45],"memory":[46,50],"parallelism":[47],"and":[48,77],"distributed":[49],"parallelism.":[51],"The":[52],"application":[53],"example":[54],"our":[56],"algorithm":[57],"FFTs":[59],"with":[60],"pencil":[61],"decomposition.":[62],"Furthermore,":[63],"we":[64],"an":[66,81],"extension":[67],"MPI":[70],"standard":[71],"in":[72,80],"order":[73],"accommodate":[75],"this":[76],"other":[78],"algorithms":[79],"efficient":[82],"way.":[83]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
