{"id":"https://openalex.org/W4391053464","doi":"https://doi.org/10.1145/3635035.3635039","title":"Task-based low-rank hybrid parallel Cholesky factorization for distributed memory environment","display_name":"Task-based low-rank hybrid parallel Cholesky factorization for distributed memory environment","publication_year":2024,"publication_date":"2024-01-18","ids":{"openalex":"https://openalex.org/W4391053464","doi":"https://doi.org/10.1145/3635035.3635039"},"language":"en","primary_location":{"id":"doi:10.1145/3635035.3635039","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3635035.3635039","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on High Performance Computing in Asia-Pacific Region","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093752436","display_name":"Han Jiao","orcid":"https://orcid.org/0009-0005-1262-2071"},"institutions":[{"id":"https://openalex.org/I66906201","display_name":"University of Yamanashi","ror":"https://ror.org/059x21724","country_code":"JP","type":"education","lineage":["https://openalex.org/I66906201"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Han Jiao","raw_affiliation_strings":["University of Yamanashi, Japan"],"raw_orcid":"https://orcid.org/0009-0005-1262-2071","affiliations":[{"raw_affiliation_string":"University of Yamanashi, Japan","institution_ids":["https://openalex.org/I66906201"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100624323","display_name":"Jilin Zhang","orcid":"https://orcid.org/0000-0003-0241-0727"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jilin Zhang","raw_affiliation_strings":["Hangzhou Dianzi University, China"],"raw_orcid":"https://orcid.org/0000-0003-0241-0727","affiliations":[{"raw_affiliation_string":"Hangzhou Dianzi University, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056237192","display_name":"Tomohiro Suzuki","orcid":"https://orcid.org/0000-0002-3091-1302"},"institutions":[{"id":"https://openalex.org/I66906201","display_name":"University of Yamanashi","ror":"https://ror.org/059x21724","country_code":"JP","type":"education","lineage":["https://openalex.org/I66906201"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomohiro Suzuki","raw_affiliation_strings":["University of Yamanashi, Japan"],"raw_orcid":"https://orcid.org/0000-0002-3091-1302","affiliations":[{"raw_affiliation_string":"University of Yamanashi, Japan","institution_ids":["https://openalex.org/I66906201"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5093752436"],"corresponding_institution_ids":["https://openalex.org/I66906201"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00565947,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"107","last_page":"116"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8865896463394165},{"id":"https://openalex.org/keywords/cholesky-decomposition","display_name":"Cholesky decomposition","score":0.8388577699661255},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.741978108882904},{"id":"https://openalex.org/keywords/task-parallelism","display_name":"Task parallelism","score":0.5379015207290649},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.514207124710083},{"id":"https://openalex.org/keywords/shared-memory","display_name":"Shared memory","score":0.4692782163619995},{"id":"https://openalex.org/keywords/memory-footprint","display_name":"Memory footprint","score":0.4547405242919922},{"id":"https://openalex.org/keywords/distributed-memory","display_name":"Distributed memory","score":0.423638254404068},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.42244553565979004},{"id":"https://openalex.org/keywords/factorization","display_name":"Factorization","score":0.4179916977882385},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.41133761405944824},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.40208256244659424},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3289737105369568},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.23504340648651123},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.14601990580558777},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.09181791543960571}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8865896463394165},{"id":"https://openalex.org/C34727166","wikidata":"https://www.wikidata.org/wiki/Q515375","display_name":"Cholesky decomposition","level":3,"score":0.8388577699661255},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.741978108882904},{"id":"https://openalex.org/C42992933","wikidata":"https://www.wikidata.org/wiki/Q691169","display_name":"Task parallelism","level":3,"score":0.5379015207290649},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.514207124710083},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.4692782163619995},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.4547405242919922},{"id":"https://openalex.org/C91481028","wikidata":"https://www.wikidata.org/wiki/Q1054686","display_name":"Distributed memory","level":3,"score":0.423638254404068},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.42244553565979004},{"id":"https://openalex.org/C187834632","wikidata":"https://www.wikidata.org/wiki/Q188804","display_name":"Factorization","level":2,"score":0.4179916977882385},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.41133761405944824},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.40208256244659424},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3289737105369568},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.23504340648651123},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.14601990580558777},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.09181791543960571},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3635035.3635039","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3635035.3635039","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on High Performance Computing in Asia-Pacific Region","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3481866935","display_name":null,"funder_award_id":"19H04127","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3541693721","display_name":null,"funder_award_id":"62072146","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6306364297","display_name":null,"funder_award_id":"2021C03187","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1968376936","https://openalex.org/W2018419001","https://openalex.org/W2121893797","https://openalex.org/W2159994240","https://openalex.org/W2160774872","https://openalex.org/W2612290557","https://openalex.org/W2766943539","https://openalex.org/W2782745921","https://openalex.org/W2887881931","https://openalex.org/W2889256647","https://openalex.org/W2963450965","https://openalex.org/W2966353369","https://openalex.org/W2995553094","https://openalex.org/W3019767051","https://openalex.org/W3036007422","https://openalex.org/W3211122343","https://openalex.org/W4211092082","https://openalex.org/W4292565208"],"related_works":["https://openalex.org/W2026512611","https://openalex.org/W1985165680","https://openalex.org/W4245497162","https://openalex.org/W2353146130","https://openalex.org/W2354572819","https://openalex.org/W1990817968","https://openalex.org/W2150064838","https://openalex.org/W1933089384","https://openalex.org/W2185094550","https://openalex.org/W2088823210"],"abstract_inverted_index":{"The":[0],"primary":[1],"targets":[2],"for":[3,6,43,56,71,79],"improving":[4,21],"efficiency":[5],"large-scale":[7],"matrix":[8],"factorization":[9,110],"are":[10],"reducing":[11],"synchronization,":[12],"addressing":[13],"the":[14,122,136,141],"overlap":[15],"in":[16,32,60,81,111],"communication":[17,93],"and":[18,20,69,102,115,131,134,138],"computation,":[19],"load":[22],"balance.":[23],"In":[24,95],"recent":[25],"years,":[26],"tiled":[27],"algorithms":[28],"with":[29,67,91],"task":[30,100],"parallelism":[31,101],"multicore":[33],"shared":[34],"memory":[35,73],"systems":[36,74],"have":[37],"become":[38],"well-established":[39],"as":[40],"efficient":[41],"methods":[42],"conducting":[44],"fine-grained":[45],"computations":[46],"on":[47,127],"smaller":[48],"tiles.":[49],"Moreover,":[50],"they":[51],"provide":[52],"flexible":[53],"execution":[54],"orders":[55],"a":[57,76,106,112],"runtime":[58],"system":[59],"many":[61],"situations.":[62],"However,":[63],"traditional":[64],"hybrid":[65,107],"programs":[66,126],"MPI":[68],"OpenMP":[70],"distributed":[72,113],"use":[75],"fork-join":[77],"model":[78],"multi-threads":[80],"each":[82],"process,":[83],"which":[84],"leads":[85],"to":[86],"thread-parallel":[87],"computing":[88],"tasks":[89],"interchange":[90],"sequential":[92],"tasks.":[94],"this":[96],"paper,":[97],"we":[98],"incorporate":[99],"low-rank":[103,118,132],"approximation":[104],"into":[105],"task-based":[108],"Cholesky":[109],"environment":[114],"propose":[116],"some":[117],"variants.":[119],"We":[120],"evaluate":[121],"performance":[123],"of":[124,140],"our":[125],"both":[128],"full-rank":[129],"inputs":[130,133],"report":[135],"pros":[137],"cons":[139],"proposed":[142],"programs.":[143]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
