{"id":"https://openalex.org/W4308303350","doi":"https://doi.org/10.1177/10943420221136873","title":"Acceleration of a parallel BDDC solver by using graphics processing units on subdomains","display_name":"Acceleration of a parallel BDDC solver by using graphics processing units on subdomains","publication_year":2022,"publication_date":"2022-11-05","ids":{"openalex":"https://openalex.org/W4308303350","doi":"https://doi.org/10.1177/10943420221136873"},"language":"en","primary_location":{"id":"doi:10.1177/10943420221136873","is_oa":false,"landing_page_url":"https://doi.org/10.1177/10943420221136873","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057184591","display_name":"Jakub \u0160\u00edstek","orcid":"https://orcid.org/0000-0002-5231-7830"},"institutions":[{"id":"https://openalex.org/I4210120266","display_name":"Czech Academy of Sciences, Institute of Mathematics","ror":"https://ror.org/02tv1yf50","country_code":"CZ","type":"facility","lineage":["https://openalex.org/I202391551","https://openalex.org/I4210120266"]},{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"Jakub \u0160\u00edstek","raw_affiliation_strings":["Czech Technical University in Prague, Czech Republic","Institute of Mathematics of the Czech Academy of Sciences, Prague, Czech Republic"],"raw_orcid":"https://orcid.org/0000-0002-5231-7830","affiliations":[{"raw_affiliation_string":"Czech Technical University in Prague, Czech Republic","institution_ids":["https://openalex.org/I44504214"]},{"raw_affiliation_string":"Institute of Mathematics of the Czech Academy of Sciences, Prague, Czech Republic","institution_ids":["https://openalex.org/I4210120266"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077560959","display_name":"Tom\u00e1\u0161 Oberhuber","orcid":"https://orcid.org/0000-0001-8374-6892"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Tom\u00e1\u0161 Oberhuber","raw_affiliation_strings":["Czech Technical University in Prague, Czech Republic"],"raw_orcid":"https://orcid.org/0000-0001-8374-6892","affiliations":[{"raw_affiliation_string":"Czech Technical University in Prague, Czech Republic","institution_ids":["https://openalex.org/I44504214"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5057184591"],"corresponding_institution_ids":["https://openalex.org/I4210120266","https://openalex.org/I44504214"],"apc_list":null,"apc_paid":null,"fwci":0.6642,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.62790627,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"37","issue":"2","first_page":"151","last_page":"164"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10339","display_name":"Advanced Numerical Methods in Computational Mathematics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10339","display_name":"Advanced Numerical Methods in Computational Mathematics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11254","display_name":"Fluid Dynamics and Vibration Analysis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.7441925406455994},{"id":"https://openalex.org/keywords/schur-complement","display_name":"Schur complement","score":0.7324591875076294},{"id":"https://openalex.org/keywords/domain-decomposition-methods","display_name":"Domain decomposition methods","score":0.6285055875778198},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5469799041748047},{"id":"https://openalex.org/keywords/saddle-point","display_name":"Saddle point","score":0.4535532593727112},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.439653605222702},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.43020206689834595},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.42910251021385193},{"id":"https://openalex.org/keywords/krylov-subspace","display_name":"Krylov subspace","score":0.4220714271068573},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.36247146129608154},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.20894384384155273},{"id":"https://openalex.org/keywords/finite-element-method","display_name":"Finite element method","score":0.1932843029499054},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.16049781441688538},{"id":"https://openalex.org/keywords/eigenvalues-and-eigenvectors","display_name":"Eigenvalues and eigenvectors","score":0.15285053849220276},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.13190844655036926}],"concepts":[{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.7441925406455994},{"id":"https://openalex.org/C2731191","wikidata":"https://www.wikidata.org/wiki/Q1778169","display_name":"Schur complement","level":3,"score":0.7324591875076294},{"id":"https://openalex.org/C198880260","wikidata":"https://www.wikidata.org/wiki/Q5289813","display_name":"Domain decomposition methods","level":3,"score":0.6285055875778198},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5469799041748047},{"id":"https://openalex.org/C2681867","wikidata":"https://www.wikidata.org/wiki/Q690935","display_name":"Saddle point","level":2,"score":0.4535532593727112},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.439653605222702},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.43020206689834595},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.42910251021385193},{"id":"https://openalex.org/C147060835","wikidata":"https://www.wikidata.org/wiki/Q1757151","display_name":"Krylov subspace","level":3,"score":0.4220714271068573},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.36247146129608154},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.20894384384155273},{"id":"https://openalex.org/C135628077","wikidata":"https://www.wikidata.org/wiki/Q220184","display_name":"Finite element method","level":2,"score":0.1932843029499054},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.16049781441688538},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.15285053849220276},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.13190844655036926},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/10943420221136873","is_oa":false,"landing_page_url":"https://doi.org/10.1177/10943420221136873","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G56741756","display_name":null,"funder_award_id":"20-01074S","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G8634377710","display_name":null,"funder_award_id":"RVO:67985840","funder_id":"https://openalex.org/F4320322482","funder_display_name":"Akademie V\u011bd \u010cesk\u00e9 Republiky"}],"funders":[{"id":"https://openalex.org/F4320321006","display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky","ror":"https://ror.org/01pv73b02"},{"id":"https://openalex.org/F4320322482","display_name":"Akademie V\u011bd \u010cesk\u00e9 Republiky","ror":"https://ror.org/053avzc18"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W133977063","https://openalex.org/W1548589512","https://openalex.org/W1978480412","https://openalex.org/W1991532854","https://openalex.org/W2000867371","https://openalex.org/W2016279572","https://openalex.org/W2021157069","https://openalex.org/W2024179839","https://openalex.org/W2036019258","https://openalex.org/W2038469228","https://openalex.org/W2057711597","https://openalex.org/W2071489648","https://openalex.org/W2089861738","https://openalex.org/W2103486983","https://openalex.org/W2106619956","https://openalex.org/W2133248904","https://openalex.org/W2270752444","https://openalex.org/W3134485366","https://openalex.org/W4229666556"],"related_works":["https://openalex.org/W2024188915","https://openalex.org/W2028160813","https://openalex.org/W2004765749","https://openalex.org/W3031624508","https://openalex.org/W4380758601","https://openalex.org/W2024362124","https://openalex.org/W2551573654","https://openalex.org/W1991285463","https://openalex.org/W2007579628","https://openalex.org/W2604862712"],"abstract_inverted_index":{"An":[0],"approach":[1,167],"to":[2,49,85,141,168,174],"accelerating":[3],"a":[4,32,132,178],"parallel":[5],"domain":[6],"decomposition":[7],"(DD)":[8],"solver":[9,18],"by":[10,27,43,58],"graphics":[11],"processing":[12],"units":[13],"(GPUs)":[14],"is":[15,19,31,138],"investigated.":[16],"The":[17,136,160],"based":[20],"on":[21,119,131],"the":[22,59,70,77,80,93,97,111,127,149,163,166],"Balancing":[23],"Domain":[24],"Decomposition":[25],"Method":[26],"Constraints":[28],"(BDDC),":[29],"which":[30],"nonoverlapping":[33],"DD":[34],"technique.":[35],"Two":[36],"kinds":[37],"of":[38,53,69,89,96,123,126,145,165],"local":[39,50,71,81,90],"matrices":[40,47,82,115],"are":[41,56,64,83,100,116,129,153],"required":[42],"BDDC.":[44,75],"First,":[45],"dense":[46,94,112],"corresponding":[48],"Schur":[51,98],"complements":[52],"interior":[54],"unknowns":[55],"constructed":[57],"sparse":[60],"direct":[61],"solver.":[62],"These":[63],"further":[65],"used":[66],"as":[67],"part":[68],"saddle-point":[72,113],"problems":[73],"within":[74],"In":[76,105],"next":[78],"step,":[79],"copied":[84],"GPUs.":[86,120],"Repeated":[87],"multiplications":[88],"vectors":[91],"with":[92,110,177],"matrix":[95],"complement":[99],"performed":[101,118,154],"for":[102],"each":[103,157],"subdomain.":[104],"addition,":[106],"factorizations":[107],"and":[108],"backsubstitutions":[109],"subdomain":[114],"also":[117,139],"Detailed":[121],"times":[122,176],"main":[124],"components":[125],"algorithm":[128],"measured":[130],"benchmark":[133],"Poisson":[134],"problem.":[135],"method":[137],"applied":[140],"an":[142],"unsteady":[143],"problem":[144],"incompressible":[146],"flow,":[147],"where":[148],"Krylov":[150],"subspace":[151],"iterations":[152],"repeatedly":[155],"in":[156],"time":[158],"step.":[159],"results":[161],"demonstrate":[162],"potential":[164],"speed":[169],"up":[170,173],"realistic":[171],"simulations":[172],"5":[175],"preference":[179],"towards":[180],"large":[181],"subdomains.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-18T08:10:14.011955","created_date":"2025-10-10T00:00:00"}
