{"id":"https://openalex.org/W2340344372","doi":"https://doi.org/10.1177/1094342015626584","title":"An MPI/OpenACC implementation of a high-order electromagnetics solver with GPUDirect communication","display_name":"An MPI/OpenACC implementation of a high-order electromagnetics solver with GPUDirect communication","publication_year":2016,"publication_date":"2016-02-03","ids":{"openalex":"https://openalex.org/W2340344372","doi":"https://doi.org/10.1177/1094342015626584","mag":"2340344372"},"language":"en","primary_location":{"id":"doi:10.1177/1094342015626584","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342015626584","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069712328","display_name":"Matthew Otten","orcid":"https://orcid.org/0000-0002-6522-5820"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]},{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Matthew Otten","raw_affiliation_strings":["Department of Physics, Cornell University, Ithaca, NY, USA","Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Physics, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]},{"raw_affiliation_string":"Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100684212","display_name":"Jing Gong","orcid":null},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Jing Gong","raw_affiliation_strings":["KTH Royal Institute of Technology, Stockholm, Sweden"],"affiliations":[{"raw_affiliation_string":"KTH Royal Institute of Technology, Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074668365","display_name":"Azamat Mametjanov","orcid":"https://orcid.org/0000-0001-7316-4231"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Azamat Mametjanov","raw_affiliation_strings":["Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057057413","display_name":"Aaron Vose","orcid":null},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aaron Vose","raw_affiliation_strings":["Cray\u2019s Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA","Cray's Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA"],"affiliations":[{"raw_affiliation_string":"Cray\u2019s Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]},{"raw_affiliation_string":"Cray's Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052750317","display_name":"John Levesque","orcid":"https://orcid.org/0000-0001-5342-4358"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"John Levesque","raw_affiliation_strings":["Cray\u2019s Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA","Cray's Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA"],"affiliations":[{"raw_affiliation_string":"Cray\u2019s Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]},{"raw_affiliation_string":"Cray's Suercomputing Cener of Excellence, Oak Ridge National Laboratory, Oak Ridge, TN, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081088881","display_name":"Paul Fischer","orcid":"https://orcid.org/0000-0002-6506-4502"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]},{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paul Fischer","raw_affiliation_strings":["Department of Computer Science, Univerisity of Illinois at Urbana\u2013Champaign, Champaign, IL, USA","Department of Mechanical Engineering, Univerisity of Illinois at Urbana\u2013Champaign, Champaign, IL, USA","Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Univerisity of Illinois at Urbana\u2013Champaign, Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"Department of Mechanical Engineering, Univerisity of Illinois at Urbana\u2013Champaign, Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029616613","display_name":"Misun Min","orcid":"https://orcid.org/0000-0002-5646-5689"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Misun Min","raw_affiliation_strings":["Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA"],"affiliations":[{"raw_affiliation_string":"Mathematics and Computer Science, Argonne National Laboratory, Lemont, IL, USA","institution_ids":["https://openalex.org/I1282105669"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5029616613"],"corresponding_institution_ids":["https://openalex.org/I1282105669"],"apc_list":null,"apc_paid":null,"fwci":5.9287,"has_fulltext":false,"cited_by_count":38,"citation_normalized_percentile":{"value":0.963698,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"30","issue":"3","first_page":"320","last_page":"334"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10339","display_name":"Advanced Numerical Methods in Computational Mathematics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10339","display_name":"Advanced Numerical Methods in Computational Mathematics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11263","display_name":"Electromagnetic Simulation and Numerical Methods","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11416","display_name":"Numerical methods for differential equations","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/2612","display_name":"Numerical Analysis"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7892155647277832},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.7305719256401062},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7146350145339966},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6809272766113281},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.6616609692573547},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.6476043462753296},{"id":"https://openalex.org/keywords/discretization","display_name":"Discretization","score":0.5298293232917786},{"id":"https://openalex.org/keywords/graphics-processing-unit","display_name":"Graphics processing unit","score":0.5212976932525635},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.5129825472831726},{"id":"https://openalex.org/keywords/message-passing","display_name":"Message passing","score":0.4855744242668152},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.46387872099876404},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.45892906188964844},{"id":"https://openalex.org/keywords/message-passing-interface","display_name":"Message Passing Interface","score":0.4247710406780243},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.41414016485214233},{"id":"https://openalex.org/keywords/precomputation","display_name":"Precomputation","score":0.4136985242366791},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.3223422169685364},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2187844216823578},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1081838607788086}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7892155647277832},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.7305719256401062},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7146350145339966},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6809272766113281},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.6616609692573547},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.6476043462753296},{"id":"https://openalex.org/C73000952","wikidata":"https://www.wikidata.org/wiki/Q17007827","display_name":"Discretization","level":2,"score":0.5298293232917786},{"id":"https://openalex.org/C2779851693","wikidata":"https://www.wikidata.org/wiki/Q183484","display_name":"Graphics processing unit","level":2,"score":0.5212976932525635},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.5129825472831726},{"id":"https://openalex.org/C854659","wikidata":"https://www.wikidata.org/wiki/Q1859284","display_name":"Message passing","level":2,"score":0.4855744242668152},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.46387872099876404},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.45892906188964844},{"id":"https://openalex.org/C166782233","wikidata":"https://www.wikidata.org/wiki/Q127879","display_name":"Message Passing Interface","level":3,"score":0.4247710406780243},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.41414016485214233},{"id":"https://openalex.org/C159379195","wikidata":"https://www.wikidata.org/wiki/Q7239568","display_name":"Precomputation","level":3,"score":0.4136985242366791},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.3223422169685364},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2187844216823578},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1081838607788086},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/1094342015626584","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1094342015626584","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4000000059604645,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W17056376","https://openalex.org/W1583515859","https://openalex.org/W2064037873","https://openalex.org/W2090843874","https://openalex.org/W2109241917","https://openalex.org/W2120919211","https://openalex.org/W2969262004"],"related_works":["https://openalex.org/W2566637483","https://openalex.org/W2127324789","https://openalex.org/W3024308452","https://openalex.org/W4244894488","https://openalex.org/W4285390450","https://openalex.org/W2090268225","https://openalex.org/W2366442643","https://openalex.org/W2021715972","https://openalex.org/W2761732860","https://openalex.org/W75461624"],"abstract_inverted_index":{"We":[0,112],"present":[1],"performance":[2,92],"results":[3,69],"and":[4,44,65,116],"an":[5,15],"analysis":[6],"of":[7,14,25,62,77,97,105,120,126],"a":[8,20,38,45],"message":[9],"passing":[10],"interface":[11],"(MPI)/OpenACC":[12],"implementation":[13,32],"electromagnetic":[16],"solver":[17],"based":[18],"on":[19,93],"spectral-element":[21],"discontinuous":[22],"Galerkin":[23],"discretization":[24],"the":[26,78,94,117],"time-dependent":[27],"Maxwell":[28],"equations.":[29],"The":[30],"OpenACC":[31],"covers":[33],"all":[34],"solution":[35],"routines,":[36],"including":[37],"highly":[39],"tuned":[40],"element-by-element":[41],"operator":[42],"evaluation":[43],"GPUDirect":[46],"gather\u2013scatter":[47],"kernel":[48],"to":[49,58,72,107],"effect":[50],"nearest":[51],"neighbor":[52],"flux":[53],"exchanges.":[54],"Modifications":[55],"are":[56],"designed":[57],"make":[59],"effective":[60],"use":[61],"vectorization,":[63],"streaming,":[64],"data":[66],"management.":[67],"Performance":[68],"using":[70],"up":[71,106],"16,384":[73],"graphics":[74],"processing":[75,90],"units":[76],"Cray":[79],"XK7":[80],"supercomputer":[81],"Titan":[82],"show":[83],"more":[84],"than":[85],"2.5\u00d7":[86],"speedup":[87],"over":[88],"central":[89],"unit-only":[91],"same":[95],"number":[96],"nodes":[98],"(262,144":[99],"MPI":[100],"ranks)":[101],"for":[102,123],"problem":[103],"sizes":[104],"6.9":[108],"billion":[109],"grid":[110],"points.":[111],"discuss":[113],"performance-enhancement":[114],"strategies":[115],"overall":[118],"potential":[119],"GPU-based":[121],"computing":[122],"this":[124],"class":[125],"problems.":[127]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":7},{"year":2015,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
