{"id":"https://openalex.org/W2902973073","doi":"https://doi.org/10.1109/hpec.2018.8547542","title":"AMulti-GPU PCISPH Implementation with Efficient Memory Transfers","display_name":"AMulti-GPU PCISPH Implementation with Efficient Memory Transfers","publication_year":2018,"publication_date":"2018-09-01","ids":{"openalex":"https://openalex.org/W2902973073","doi":"https://doi.org/10.1109/hpec.2018.8547542","mag":"2902973073"},"language":"en","primary_location":{"id":"doi:10.1109/hpec.2018.8547542","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpec.2018.8547542","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE High Performance extreme Computing Conference (HPEC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012499296","display_name":"Kevin Verma","orcid":"https://orcid.org/0000-0002-8058-7520"},"institutions":[{"id":"https://openalex.org/I121883995","display_name":"Johannes Kepler University of Linz","ror":"https://ror.org/052r2xn60","country_code":"AT","type":"education","lineage":["https://openalex.org/I121883995"]}],"countries":["AT"],"is_corresponding":true,"raw_author_name":"Kevin Verma","raw_affiliation_strings":["Institute for Integrated Circuits, Johannes Kepler University, Linz, Austria"],"affiliations":[{"raw_affiliation_string":"Institute for Integrated Circuits, Johannes Kepler University, Linz, Austria","institution_ids":["https://openalex.org/I121883995"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120312334","display_name":"Chong Peng","orcid":"https://orcid.org/0000-0002-6083-2656"},"institutions":[{"id":"https://openalex.org/I4210110916","display_name":"Engineering Software Steyr (Austria)","ror":"https://ror.org/0175s4d43","country_code":"AT","type":"company","lineage":["https://openalex.org/I4210110916"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Chong Peng","raw_affiliation_strings":["ESS Engineering Software Steyr GmbH, Austria"],"affiliations":[{"raw_affiliation_string":"ESS Engineering Software Steyr GmbH, Austria","institution_ids":["https://openalex.org/I4210110916"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056958186","display_name":"Kamil Szewc","orcid":"https://orcid.org/0000-0002-9080-1551"},"institutions":[{"id":"https://openalex.org/I4210110916","display_name":"Engineering Software Steyr (Austria)","ror":"https://ror.org/0175s4d43","country_code":"AT","type":"company","lineage":["https://openalex.org/I4210110916"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Kamil Szewc","raw_affiliation_strings":["ESS Engineering Software Steyr GmbH, Austria"],"affiliations":[{"raw_affiliation_string":"ESS Engineering Software Steyr GmbH, Austria","institution_ids":["https://openalex.org/I4210110916"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004214923","display_name":"Robert Wille","orcid":"https://orcid.org/0000-0002-4993-7860"},"institutions":[{"id":"https://openalex.org/I121883995","display_name":"Johannes Kepler University of Linz","ror":"https://ror.org/052r2xn60","country_code":"AT","type":"education","lineage":["https://openalex.org/I121883995"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Robert Wille","raw_affiliation_strings":["Institute for Integrated Circuits, Johannes Kepler University, Linz, Austria"],"affiliations":[{"raw_affiliation_string":"Institute for Integrated Circuits, Johannes Kepler University, Linz, Austria","institution_ids":["https://openalex.org/I121883995"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5012499296"],"corresponding_institution_ids":["https://openalex.org/I121883995"],"apc_list":null,"apc_paid":null,"fwci":1.4187,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.80033189,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11694","display_name":"Fluid Dynamics Simulations and Interactions","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11694","display_name":"Fluid Dynamics Simulations and Interactions","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11751","display_name":"Lattice Boltzmann Simulation Studies","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11382","display_name":"Fluid Dynamics and Heat Transfer","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8528957962989807},{"id":"https://openalex.org/keywords/smoothed-particle-hydrodynamics","display_name":"Smoothed-particle hydrodynamics","score":0.6889045238494873},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6754498481750488},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6630858182907104},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6077756881713867},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.5788825154304504},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5216907858848572},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.46160808205604553},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.4439203441143036},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.4244150221347809},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3335449993610382},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07910910248756409}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8528957962989807},{"id":"https://openalex.org/C122564879","wikidata":"https://www.wikidata.org/wiki/Q733073","display_name":"Smoothed-particle hydrodynamics","level":2,"score":0.6889045238494873},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6754498481750488},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6630858182907104},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6077756881713867},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.5788825154304504},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5216907858848572},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.46160808205604553},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4439203441143036},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.4244150221347809},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3335449993610382},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07910910248756409},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C57879066","wikidata":"https://www.wikidata.org/wiki/Q41217","display_name":"Mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpec.2018.8547542","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpec.2018.8547542","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE High Performance extreme Computing Conference (HPEC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.4699999988079071,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320323031","display_name":"\u00d6sterreichische Forschungsf\u00f6rderungsgesellschaft","ror":"https://ror.org/028jc0449"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1503550591","https://openalex.org/W1975615012","https://openalex.org/W1976697629","https://openalex.org/W1980938760","https://openalex.org/W1994439127","https://openalex.org/W2008803661","https://openalex.org/W2044355921","https://openalex.org/W2044602433","https://openalex.org/W2045670663","https://openalex.org/W2060240696","https://openalex.org/W2114987640","https://openalex.org/W2131057369","https://openalex.org/W2139238466","https://openalex.org/W2168414272","https://openalex.org/W2321310861","https://openalex.org/W2766757481","https://openalex.org/W2899416081","https://openalex.org/W3116923327","https://openalex.org/W4211072219","https://openalex.org/W4234167293","https://openalex.org/W6630063115"],"related_works":["https://openalex.org/W17155033","https://openalex.org/W4379644454","https://openalex.org/W3207760230","https://openalex.org/W3189307731","https://openalex.org/W2949962288","https://openalex.org/W2364686214","https://openalex.org/W1428699136","https://openalex.org/W1998560227","https://openalex.org/W2026263283","https://openalex.org/W2022772718"],"abstract_inverted_index":{"Smoothed":[0],"Particle":[1],"Hydrodynamics":[2],"(SPH)":[3],"is":[4,17,79],"a":[5,24,50,97,117,128],"particle-based":[6,45],"method":[7,104],"for":[8,112,120],"fluid":[9],"flow":[10],"modeling.":[11],"One":[12],"promising":[13],"variant":[14],"of":[15,39,63,86,93,154,161],"SPH":[16,20,33,71],"Predictive-Corrective":[18],"Incompressible":[19],"(PCISPH),":[21],"which":[22,130],"employs":[23],"dedicate":[25],"prediction-correction":[26],"scheme":[27,129],"and,":[28,142],"by":[29,35,139,143,149],"this,":[30,144],"outperforms":[31],"other":[32,44],"variants":[34],"almost":[36],"one":[37],"order":[38,55],"magnitude.":[40],"However,":[41,89],"similar":[42],"to":[43,56,66,73,82,100,132],"methods,":[46],"it":[47,78,96],"suffers":[48],"from":[49],"huge":[51],"numerical":[52],"complexity.":[53],"In":[54,107],"simulate":[57],"real":[58,74],"world":[59,75],"phenomena,":[60],"several":[61],"millions":[62],"particles":[64],"need":[65],"be":[67],"considered.":[68],"To":[69,122],"make":[70,95],"applicable":[72],"engineering":[76],"problems,":[77],"hence":[80],"common":[81],"exploit":[83],"massive":[84],"parallelism":[85],"multi-GPU":[87,118],"architectures.":[88],"certain":[90],"algorithmic":[91,152],"characteristics":[92,153],"PCISPH":[94],"non-trivial":[98],"task":[99],"efficiently":[101],"parallelize":[102],"this":[103,108,123],"on":[105],"multi-GPUs.":[106],"work,":[109],"we":[110,125],"are,":[111],"the":[113,134,146,150,159,162],"first":[114],"time,":[115],"proposing":[116,127],"implementation":[119],"PCISPH.":[121,155],"end,":[124],"are":[126],"allows":[131],"overlap":[133],"memory":[135],"transfers":[136],"between":[137],"GPUs":[138],"actual":[140],"computations":[141],"avoids":[145],"drawbacks":[147],"caused":[148],"mentioned":[151],"Experimental":[156],"evaluations":[157],"confirm":[158],"efficiency":[160],"proposed":[163],"methods.":[164]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
