{"id":"https://openalex.org/W3097943479","doi":"https://doi.org/10.1177/10943420211017188","title":"A GPU-accelerated adaptive FSAI preconditioner for massively parallel simulations","display_name":"A GPU-accelerated adaptive FSAI preconditioner for massively parallel simulations","publication_year":2021,"publication_date":"2021-05-17","ids":{"openalex":"https://openalex.org/W3097943479","doi":"https://doi.org/10.1177/10943420211017188","mag":"3097943479"},"language":"en","primary_location":{"id":"doi:10.1177/10943420211017188","is_oa":false,"landing_page_url":"https://doi.org/10.1177/10943420211017188","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2010.14175","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030722968","display_name":"Giovanni Isotton","orcid":"https://orcid.org/0000-0002-1548-2378"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Giovanni Isotton","raw_affiliation_strings":["M3E S.r.l., via Giambellino 7, 35129 Paova, Italy"],"affiliations":[{"raw_affiliation_string":"M3E S.r.l., via Giambellino 7, 35129 Paova, Italy","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066565638","display_name":"Carlo Janna","orcid":"https://orcid.org/0000-0001-7286-8122"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Carlo Janna","raw_affiliation_strings":["M3E S.r.l., via Giambellino 7, 35129 Paova, Italy"],"affiliations":[{"raw_affiliation_string":"M3E S.r.l., via Giambellino 7, 35129 Paova, Italy","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006496977","display_name":"Massimo Bernaschi","orcid":"https://orcid.org/0000-0003-3661-9836"},"institutions":[{"id":"https://openalex.org/I3005160176","display_name":"Institute for High Performance Computing and Networking","ror":"https://ror.org/04r5fge26","country_code":"IT","type":"facility","lineage":["https://openalex.org/I3005160176","https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Massimo Bernaschi","raw_affiliation_strings":["Institute for Applied Computing, CNR, 00185 Rome, Italy"],"affiliations":[{"raw_affiliation_string":"Institute for Applied Computing, CNR, 00185 Rome, Italy","institution_ids":["https://openalex.org/I3005160176"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5030722968"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.1508,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.46989891,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"36","issue":"2","first_page":"153","last_page":"166"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/preconditioner","display_name":"Preconditioner","score":0.8898879289627075},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.8063677549362183},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7851617336273193},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7099907398223877},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6881821751594543},{"id":"https://openalex.org/keywords/linear-system","display_name":"Linear system","score":0.5518265962600708},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.4663507044315338},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.459620863199234},{"id":"https://openalex.org/keywords/ideal","display_name":"Ideal (ethics)","score":0.45784610509872437},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4352337718009949},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4223771393299103},{"id":"https://openalex.org/keywords/linear-algebra","display_name":"Linear algebra","score":0.4119229018688202},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.3662392497062683},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.282046914100647},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1491738259792328}],"concepts":[{"id":"https://openalex.org/C167431342","wikidata":"https://www.wikidata.org/wiki/Q1754327","display_name":"Preconditioner","level":3,"score":0.8898879289627075},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.8063677549362183},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7851617336273193},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7099907398223877},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6881821751594543},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.5518265962600708},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4663507044315338},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.459620863199234},{"id":"https://openalex.org/C2776639384","wikidata":"https://www.wikidata.org/wiki/Q840396","display_name":"Ideal (ethics)","level":2,"score":0.45784610509872437},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4352337718009949},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4223771393299103},{"id":"https://openalex.org/C139352143","wikidata":"https://www.wikidata.org/wiki/Q82571","display_name":"Linear algebra","level":2,"score":0.4119229018688202},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.3662392497062683},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.282046914100647},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1491738259792328},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1177/10943420211017188","is_oa":false,"landing_page_url":"https://doi.org/10.1177/10943420211017188","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2010.14175","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2010.14175","pdf_url":"https://arxiv.org/pdf/2010.14175","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2010.14175","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2010.14175","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:3097943479","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2010.14175","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2010.14175","pdf_url":"https://arxiv.org/pdf/2010.14175","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.4399999976158142,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W599829644","https://openalex.org/W1525132831","https://openalex.org/W1845641575","https://openalex.org/W1965034778","https://openalex.org/W1966756606","https://openalex.org/W1979511352","https://openalex.org/W1981220107","https://openalex.org/W1985263109","https://openalex.org/W1987289683","https://openalex.org/W1994805693","https://openalex.org/W2038516134","https://openalex.org/W2062233541","https://openalex.org/W2078311192","https://openalex.org/W2088200553","https://openalex.org/W2089099677","https://openalex.org/W2097979586","https://openalex.org/W2110290705","https://openalex.org/W2156588317","https://openalex.org/W2271597431","https://openalex.org/W2483451257","https://openalex.org/W2767066575","https://openalex.org/W2896944770","https://openalex.org/W2908144813","https://openalex.org/W2944108582","https://openalex.org/W2946073031","https://openalex.org/W2963106000","https://openalex.org/W2963889991","https://openalex.org/W2968917987","https://openalex.org/W2993109347","https://openalex.org/W3000202699","https://openalex.org/W3006501671","https://openalex.org/W3007284522"],"related_works":["https://openalex.org/W3051669108","https://openalex.org/W2965979058","https://openalex.org/W3119799675","https://openalex.org/W2599987010","https://openalex.org/W3005868431","https://openalex.org/W2246456778","https://openalex.org/W2917002098","https://openalex.org/W963568387","https://openalex.org/W3102736503","https://openalex.org/W2071542942","https://openalex.org/W948471287","https://openalex.org/W365641226","https://openalex.org/W2575476607","https://openalex.org/W2893007245","https://openalex.org/W3032663520","https://openalex.org/W3131578829","https://openalex.org/W2005061189","https://openalex.org/W2230867224","https://openalex.org/W3158204061","https://openalex.org/W2949001880"],"abstract_inverted_index":{"The":[0],"solution":[1,23],"of":[2,5,14,24,30,43,60,115,132],"linear":[3,25,167],"systems":[4,26],"equations":[6],"is":[7,63,138],"a":[8,12,36,111,122,140,162],"central":[9],"task":[10],"in":[11,39,94,134,161,165],"number":[13],"scientific":[15,44],"and":[16,45,91,159],"engineering":[17],"applications.":[18],"In":[19,97],"many":[20],"cases":[21],"the":[22,31,40,152],"may":[27],"take":[28],"most":[29],"simulation":[32],"time":[33],"thus":[34],"representing":[35],"major":[37],"bottleneck":[38],"further":[41],"development":[42],"technical":[46],"software.":[47],"For":[48],"large":[49],"scale":[50],"simulations,":[51],"nowadays":[52],"accounting":[53],"for":[54,72],"several":[55],"millions":[56],"or":[57],"even":[58],"billions":[59],"unknowns,":[61],"it":[62],"quite":[64],"common":[65],"to":[66,68,88],"resort":[67],"preconditioned":[69],"iterative":[70],"solvers":[71],"exploiting":[73],"their":[74],"low":[75],"memory":[76,124],"requirements":[77],"and,":[78],"at":[79],"least":[80],"potential,":[81],"parallelism.":[82],"Approximate":[83,106],"inverses":[84],"have":[85],"been":[86],"shown":[87],"be":[89,118],"robust":[90],"effective":[92],"preconditioners":[93,158],"various":[95],"contexts.":[96],"this":[98],"work,":[99],"we":[100,144],"show":[101,145],"how":[102,151],"adaptive":[103,135],"Factored":[104],"Sparse":[105],"Inverse":[107],"(aFSAI),":[108],"characterized":[109],"by":[110],"very":[112],"high":[113],"degree":[114],"parallelism,":[116],"can":[117],"successfully":[119],"implemented":[120],"on":[121],"distributed":[123],"computer":[125],"equipped":[126],"with":[127],"GPU":[128],"accelerators.":[129],"Taking":[130],"advantage":[131],"GPUs":[133],"FSAI":[136],"set-up":[137],"not":[139],"trivial":[141],"task,":[142],"nevertheless":[143],"through":[146],"an":[147],"extensive":[148],"numerical":[149],"experimentation":[150],"proposed":[153],"approach":[154],"outperforms":[155],"more":[156],"traditional":[157],"results":[160],"close-to-ideal":[163],"behavior":[164],"challenging":[166],"algebra":[168],"problems.":[169]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
