{"id":"https://openalex.org/W3186081252","doi":"https://doi.org/10.3390/a14070204","title":"A Comparative Study of Block Incomplete Sparse Approximate Inverses Preconditioning on Tesla K20 and V100 GPUs","display_name":"A Comparative Study of Block Incomplete Sparse Approximate Inverses Preconditioning on Tesla K20 and V100 GPUs","publication_year":2021,"publication_date":"2021-06-30","ids":{"openalex":"https://openalex.org/W3186081252","doi":"https://doi.org/10.3390/a14070204","mag":"3186081252"},"language":"en","primary_location":{"id":"doi:10.3390/a14070204","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a14070204","pdf_url":"https://www.mdpi.com/1999-4893/14/7/204/pdf?version=1625133748","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/1999-4893/14/7/204/pdf?version=1625133748","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110665483","display_name":"Wenpeng Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I130750295","display_name":"Xinyang Normal University","ror":"https://ror.org/0190x2a66","country_code":"CN","type":"education","lineage":["https://openalex.org/I130750295"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenpeng Ma","raw_affiliation_strings":["School of Computer and Information Technology, Xinyang Normal University, Xinyang 464000, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Xinyang Normal University, Xinyang 464000, China","institution_ids":["https://openalex.org/I130750295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115596406","display_name":"Yuan Wu","orcid":"https://orcid.org/0000-0001-9107-2197"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210108629","display_name":"Computer Network Information Center","ror":"https://ror.org/01s0wyf50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210108629"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wu Yuan","raw_affiliation_strings":["Computer Network Information Center, Chinese Academy of Sciences, Beijing 100190, China"],"affiliations":[{"raw_affiliation_string":"Computer Network Information Center, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210108629","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070790173","display_name":"Xiazhen Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210108629","display_name":"Computer Network Information Center","ror":"https://ror.org/01s0wyf50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210108629"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiazhen Liu","raw_affiliation_strings":["Computer Network Information Center, Chinese Academy of Sciences, Beijing 100190, China"],"affiliations":[{"raw_affiliation_string":"Computer Network Information Center, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210108629","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110665483"],"corresponding_institution_ids":["https://openalex.org/I130750295"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1362646,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":"7","first_page":"204","last_page":"204"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10339","display_name":"Advanced Numerical Methods in Computational Mathematics","score":0.9832000136375427,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/preconditioner","display_name":"Preconditioner","score":0.7538442611694336},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7071399092674255},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6912893652915955},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.649323046207428},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.4116535782814026},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.35075122117996216},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.22382771968841553},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21932101249694824},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.10615405440330505},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09208288788795471}],"concepts":[{"id":"https://openalex.org/C167431342","wikidata":"https://www.wikidata.org/wiki/Q1754327","display_name":"Preconditioner","level":3,"score":0.7538442611694336},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7071399092674255},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6912893652915955},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.649323046207428},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.4116535782814026},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35075122117996216},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.22382771968841553},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21932101249694824},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.10615405440330505},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09208288788795471},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/a14070204","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a14070204","pdf_url":"https://www.mdpi.com/1999-4893/14/7/204/pdf?version=1625133748","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:e0d03316da4942b1b601a9d755d20f20","is_oa":true,"landing_page_url":"https://doaj.org/article/e0d03316da4942b1b601a9d755d20f20","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms, Vol 14, Iss 7, p 204 (2021)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/1999-4893/14/7/204/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/a14070204","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms; Volume 14; Issue 7; Pages: 204","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/a14070204","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a14070204","pdf_url":"https://www.mdpi.com/1999-4893/14/7/204/pdf?version=1625133748","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G19332936","display_name":null,"funder_award_id":"61702438","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8715688735","display_name":null,"funder_award_id":"2019YFB1704202","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3186081252.pdf","grobid_xml":"https://content.openalex.org/works/W3186081252.grobid-xml"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W1506342804","https://openalex.org/W1965034778","https://openalex.org/W1981367360","https://openalex.org/W1994805693","https://openalex.org/W2035080386","https://openalex.org/W2049664825","https://openalex.org/W2095258827","https://openalex.org/W2140153041","https://openalex.org/W2151819818","https://openalex.org/W2181846018","https://openalex.org/W2252346314","https://openalex.org/W2290916141","https://openalex.org/W2406344247","https://openalex.org/W2469975815","https://openalex.org/W2519968131","https://openalex.org/W2544527082","https://openalex.org/W2557929373","https://openalex.org/W2741907101","https://openalex.org/W2767023738","https://openalex.org/W2767066575","https://openalex.org/W2900987589","https://openalex.org/W2993109347","https://openalex.org/W2996917989","https://openalex.org/W3100838950","https://openalex.org/W3165049063","https://openalex.org/W6659374036"],"related_works":["https://openalex.org/W2357336958","https://openalex.org/W4281839678","https://openalex.org/W2535797495","https://openalex.org/W152950973","https://openalex.org/W2300963337","https://openalex.org/W2029210135","https://openalex.org/W2047866757","https://openalex.org/W3202552726","https://openalex.org/W1592977960","https://openalex.org/W4388736814"],"abstract_inverted_index":{"Incomplete":[0],"Sparse":[1],"Approximate":[2],"Inverses":[3],"(ISAI)":[4],"has":[5],"shown":[6],"some":[7],"advantages":[8],"over":[9,97],"sparse":[10],"triangular":[11,101],"solves":[12,102],"on":[13,70,77],"GPUs":[14,38,74,83,131],"when":[15],"it":[16],"is":[17,125],"used":[18],"for":[19,34,107],"the":[20,30,46,50,57,98,104,108,111,118],"incomplete":[21],"LU":[22],"based":[23,100],"preconditioner.":[24],"In":[25,56],"this":[26],"paper,":[27],"we":[28],"extend":[29],"single":[31],"GPU":[32],"method":[33],"Block\u2013ISAI":[35,69,92,116],"to":[36,72,133],"multiple":[37],"algorithm":[39],"by":[40],"coupling":[41],"Block\u2013Jacobi":[42,89],"preconditioner,":[43],"and":[44,64,86,110,117],"introduce":[45],"detailed":[47],"implementation":[48],"in":[49],"open":[51],"source":[52],"numerical":[53],"package":[54],"PETSc.":[55],"experiments,":[58],"two":[59,78],"representative":[60],"cases":[61],"are":[62,75],"performed":[63],"a":[65],"comparative":[66],"study":[67],"of":[68,81,113,123],"up":[71,115],"four":[73],"conducted":[76],"major":[79],"generations":[80],"NVIDIA\u2019s":[82],"(Tesla":[84],"K20":[85,135],"Tesla":[87,129,134],"V100).":[88],"preconditioning":[90],"with":[91],"(BJPB-ISAI)":[93],"shows":[94],"an":[95],"advantage":[96],"level-scheduling":[99],"from":[103],"cuSPARSE":[105],"library":[106],"cases,":[109],"overhead":[112],"setting":[114],"total":[119],"wall":[120],"clock":[121],"times":[122],"GMRES":[124],"greatly":[126],"reduced":[127],"using":[128],"V100":[130],"compared":[132],"GPUs.":[136]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
