{"id":"https://openalex.org/W4385062345","doi":"https://doi.org/10.1109/tc.2023.3296884","title":"Coupled Incomplete Cholesky and Jacobi Preconditioned Conjugate Gradient on the New Generation of Sunway Many-Core Architecture","display_name":"Coupled Incomplete Cholesky and Jacobi Preconditioned Conjugate Gradient on the New Generation of Sunway Many-Core Architecture","publication_year":2023,"publication_date":"2023-07-20","ids":{"openalex":"https://openalex.org/W4385062345","doi":"https://doi.org/10.1109/tc.2023.3296884"},"language":"en","primary_location":{"id":"doi:10.1109/tc.2023.3296884","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tc.2023.3296884","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062453835","display_name":"Yuejin Ye","orcid":"https://orcid.org/0000-0002-2911-8550"},"institutions":[{"id":"https://openalex.org/I4210158984","display_name":"National Supercomputing Center in Wuxi","ror":"https://ror.org/04ypjrs34","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210158984"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuejin Ye","raw_affiliation_strings":["National Supercomputing Center, Wuxi, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputing Center, Wuxi, China","institution_ids":["https://openalex.org/I4210158984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100354395","display_name":"Heng Guo","orcid":"https://orcid.org/0000-0001-8148-0226"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Guo","raw_affiliation_strings":["College of Computer Science and Technology, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030293399","display_name":"Bingzhuo Wang","orcid":"https://orcid.org/0009-0003-7507-7299"},"institutions":[{"id":"https://openalex.org/I4210158984","display_name":"National Supercomputing Center in Wuxi","ror":"https://ror.org/04ypjrs34","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210158984"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingzhuo Wang","raw_affiliation_strings":["National Supercomputing Center, Wuxi, China"],"affiliations":[{"raw_affiliation_string":"National Supercomputing Center, Wuxi, China","institution_ids":["https://openalex.org/I4210158984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073978555","display_name":"P. S. P. Wang","orcid":"https://orcid.org/0000-0002-0060-1514"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengxiao Wang","raw_affiliation_strings":["College of Computer Science and Technology, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056860593","display_name":"Dexun Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dexun Chen","raw_affiliation_strings":["National Research Center of Parallel Computer Engineering &#x0026; Technology, Wuxi, China"],"affiliations":[{"raw_affiliation_string":"National Research Center of Parallel Computer Engineering &#x0026; Technology, Wuxi, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100394179","display_name":"Fang Li","orcid":"https://orcid.org/0000-0002-3555-2126"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang Li","raw_affiliation_strings":["National Research Center of Parallel Computer Engineering &#x0026; Technology, Wuxi, China"],"affiliations":[{"raw_affiliation_string":"National Research Center of Parallel Computer Engineering &#x0026; Technology, Wuxi, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5062453835"],"corresponding_institution_ids":["https://openalex.org/I4210158984"],"apc_list":null,"apc_paid":null,"fwci":0.8157,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.76224731,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"72","issue":"11","first_page":"3326","last_page":"3339"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cholesky-decomposition","display_name":"Cholesky decomposition","score":0.8101767897605896},{"id":"https://openalex.org/keywords/preconditioner","display_name":"Preconditioner","score":0.7534843683242798},{"id":"https://openalex.org/keywords/conjugate-gradient-method","display_name":"Conjugate gradient method","score":0.6339448690414429},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5709327459335327},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5643146634101868},{"id":"https://openalex.org/keywords/incomplete-cholesky-factorization","display_name":"Incomplete Cholesky factorization","score":0.42377519607543945},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.35500192642211914},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2964943051338196},{"id":"https://openalex.org/keywords/eigenvalues-and-eigenvectors","display_name":"Eigenvalues and eigenvectors","score":0.16732385754585266},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.12293887138366699}],"concepts":[{"id":"https://openalex.org/C34727166","wikidata":"https://www.wikidata.org/wiki/Q515375","display_name":"Cholesky decomposition","level":3,"score":0.8101767897605896},{"id":"https://openalex.org/C167431342","wikidata":"https://www.wikidata.org/wiki/Q1754327","display_name":"Preconditioner","level":3,"score":0.7534843683242798},{"id":"https://openalex.org/C81184566","wikidata":"https://www.wikidata.org/wiki/Q1191895","display_name":"Conjugate gradient method","level":2,"score":0.6339448690414429},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5709327459335327},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5643146634101868},{"id":"https://openalex.org/C44363057","wikidata":"https://www.wikidata.org/wiki/Q6015160","display_name":"Incomplete Cholesky factorization","level":4,"score":0.42377519607543945},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.35500192642211914},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2964943051338196},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.16732385754585266},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.12293887138366699},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tc.2023.3296884","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tc.2023.3296884","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Life below water","score":0.5099999904632568,"id":"https://metadata.un.org/sdg/14"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W105972517","https://openalex.org/W126988573","https://openalex.org/W1525132831","https://openalex.org/W1961414889","https://openalex.org/W1976250820","https://openalex.org/W1981220107","https://openalex.org/W1985923806","https://openalex.org/W2035080386","https://openalex.org/W2066943869","https://openalex.org/W2083380483","https://openalex.org/W2084073638","https://openalex.org/W2095258827","https://openalex.org/W2098528027","https://openalex.org/W2103290518","https://openalex.org/W2122824057","https://openalex.org/W2124192278","https://openalex.org/W2136324023","https://openalex.org/W2157867995","https://openalex.org/W2163304326","https://openalex.org/W2280592497","https://openalex.org/W2318393100","https://openalex.org/W2338973660","https://openalex.org/W2504261469","https://openalex.org/W2551520134","https://openalex.org/W2569133694","https://openalex.org/W2751354592","https://openalex.org/W2767394883","https://openalex.org/W2786704328","https://openalex.org/W2794042324","https://openalex.org/W2794424798","https://openalex.org/W2885034848","https://openalex.org/W2891832717","https://openalex.org/W2899296673","https://openalex.org/W2904093264","https://openalex.org/W2921480401","https://openalex.org/W2999857212","https://openalex.org/W3130892198","https://openalex.org/W4239359156","https://openalex.org/W4293731590","https://openalex.org/W6755985509"],"related_works":["https://openalex.org/W2078637543","https://openalex.org/W2986384163","https://openalex.org/W3022256543","https://openalex.org/W2809896915","https://openalex.org/W2966631139","https://openalex.org/W2063502215","https://openalex.org/W2146296113","https://openalex.org/W2365612721","https://openalex.org/W2887042214","https://openalex.org/W2114781389"],"abstract_inverted_index":{"The":[0,43,143],"Preconditioned":[1],"Conjugate":[2],"Gradient":[3],"method":[4,49,113,165],"is":[5,17,92,152,161],"one":[6],"of":[7,103,158],"the":[8,28,51,63,82,104,120,134,139,148,156,167,175,186,196],"most":[9],"important":[10],"solvers":[11],"in":[12,20,54],"linear":[13],"algebra":[14],"system,":[15],"and":[16,22,39,60,76,117,119,155,181],"widely":[18],"used":[19],"scientific":[21],"engineering":[23],"computing":[24],"applications.":[25],"Based":[26],"on":[27,66,81,114,125,133,195],"Sunway":[29,83,105,197],"heterogeneous":[30,84,106],"many-core":[31,85,107],"architecture,":[32],"we":[33],"propose":[34],"a":[35,46,71,88],"Coupled":[36],"Incomplete":[37],"Cholesky":[38,178],"Jacobi":[40,48],"preconditioner":[41,44,179,190],"(CICJ).":[42],"applies":[45],"block":[47],"to":[50],"matrix":[52,58,149],"inversion":[53],"preconditioning":[55],"process,":[56],"localizes":[57],"inversions":[59],"completely":[61],"eliminates":[62],"data":[64],"correlation":[65],"slave":[67],"cores.":[68],"It":[69],"strikes":[70],"better":[72],"trade-off":[73],"between":[74],"convergence":[75],"parallelism":[77],"than":[78],"other":[79],"preconditioners":[80],"architecture.":[86,108],"Besides,":[87],"two-level":[89],"software-controlled":[90],"cache":[91],"designed":[93],"for":[94],"sparse":[95],"matrix-vector":[96],"multiplication":[97],"operations,":[98],"which":[99],"makes":[100],"full":[101],"use":[102],"We":[109,129],"apply":[110],"our":[111,164],"CICJ":[112],"Intel,":[115],"GPU,":[116],"Sunway,":[118],"results":[121,144],"show":[122,145],"great":[123],"generality":[124],"all":[126],"three":[127],"architectures.":[128],"also":[130],"conduct":[131],"experiments":[132],"underwater":[135],"submarine":[136],"models":[137],"using":[138,192],"open-source":[140],"framework":[141],"OpenFOAM.":[142],"that":[146],"when":[147],"column":[150],"size":[151],"0.82":[153],"billion":[154],"number":[157],"non-zero":[159],"values":[160],"59":[162],"billion,":[163],"accelerates":[166],"whole":[168],"algorithm":[169],"by":[170],"8.42":[171],"times":[172,183],"compared":[173,184],"with":[174,185],"diagonal":[176],"incomplete":[177],"(DIC)":[180],"6.5":[182],"geometric":[187],"algebraic":[188],"multi-grid":[189],"(GAMG)":[191],"133,120":[193],"processors":[194],"system.":[198]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2026-03-04T09:10:02.777135","created_date":"2025-10-10T00:00:00"}
