{"id":"https://openalex.org/W4393855615","doi":"https://doi.org/10.1177/10943420241242021","title":"An inherently parallel \u210b<sup>2</sup>-ULV factorization for solving dense linear systems on GPUs","display_name":"An inherently parallel \u210b<sup>2</sup>-ULV factorization for solving dense linear systems on GPUs","publication_year":2024,"publication_date":"2024-04-03","ids":{"openalex":"https://openalex.org/W4393855615","doi":"https://doi.org/10.1177/10943420241242021"},"language":"en","primary_location":{"id":"doi:10.1177/10943420241242021","is_oa":false,"landing_page_url":"https://doi.org/10.1177/10943420241242021","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2502.02395","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040574670","display_name":"Qianxiang Ma","orcid":"https://orcid.org/0000-0003-4688-5644"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Qianxiang Ma","raw_affiliation_strings":["School of Computing, Tokyo Institute of Technology, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"School of Computing, Tokyo Institute of Technology, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024747717","display_name":"Rio Yokota","orcid":"https://orcid.org/0000-0001-7573-7873"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Rio Yokota","raw_affiliation_strings":["Global Scientific Information and Computing Center, Tokyo Institute of Technology, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Global Scientific Information and Computing Center, Tokyo Institute of Technology, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5024747717"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":0.9951,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.72544559,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"38","issue":"4","first_page":"314","last_page":"336"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11263","display_name":"Electromagnetic Simulation and Numerical Methods","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/factorization","display_name":"Factorization","score":0.7424218654632568},{"id":"https://openalex.org/keywords/linear-system","display_name":"Linear system","score":0.46497654914855957},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4338856637477875},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4013461172580719},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.3209499716758728},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.29221469163894653},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.18480154871940613},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.0692797303199768}],"concepts":[{"id":"https://openalex.org/C187834632","wikidata":"https://www.wikidata.org/wiki/Q188804","display_name":"Factorization","level":2,"score":0.7424218654632568},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.46497654914855957},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4338856637477875},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4013461172580719},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.3209499716758728},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29221469163894653},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.18480154871940613},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0692797303199768}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1177/10943420241242021","is_oa":false,"landing_page_url":"https://doi.org/10.1177/10943420241242021","pdf_url":null,"source":{"id":"https://openalex.org/S60606485","display_name":"The International Journal of High Performance Computing Applications","issn_l":"1094-3420","issn":["1094-3420","1741-2846"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of High Performance Computing Applications","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2502.02395","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.02395","pdf_url":"https://arxiv.org/pdf/2502.02395","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2502.02395","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.02395","pdf_url":"https://arxiv.org/pdf/2502.02395","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1069223013","display_name":null,"funder_award_id":"JSPS KAKENHI","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G1694571055","display_name":null,"funder_award_id":"JP21H03447","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G2061319648","display_name":null,"funder_award_id":"JP22H0359","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G2792802287","display_name":null,"funder_award_id":"KAKENHI","funder_id":"https://openalex.org/F4320338075","funder_display_name":"Core Research for Evolutional Science and Technology"},{"id":"https://openalex.org/G3282004645","display_name":null,"funder_award_id":"JPMJCR","funder_id":"https://openalex.org/F4320338075","funder_display_name":"Core Research for Evolutional Science and Technology"},{"id":"https://openalex.org/G3459562248","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3938381110","display_name":"\u5341\u548c\u7530\u30ab\u30eb\u30c7\u30e9\u5674\u51fa\u7269\u306e\u706b\u5c71\u5c64\u5e8f\u5b66\u7684\u7814\u7a76","funder_award_id":"23005","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4636223006","display_name":null,"funder_award_id":"JSPS KAK","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5778814166","display_name":null,"funder_award_id":"K2062","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5938650130","display_name":null,"funder_award_id":"21H03447","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G6317729023","display_name":null,"funder_award_id":"22H03598","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G6718509927","display_name":null,"funder_award_id":"CREST","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G6723945271","display_name":"\u76e3\u67fb\u5f79\u304a\u3088\u3073\u4f1a\u8a08\u58eb\u306e\u76e3\u67fb\u5236\u5ea6\u306b\u95a2\u3059\u308b\u7814\u7a76","funder_award_id":"30009","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G720495953","display_name":"Application of Unconventional Linear Algebra Techniques to Continuous Learning in Supergiant Neural Networks","funder_award_id":"20K20624","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7752643416","display_name":null,"funder_award_id":"Japan","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7840269759","display_name":null,"funder_award_id":"JP20K","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8430481527","display_name":null,"funder_award_id":"Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"},{"id":"https://openalex.org/F4320338075","display_name":"Core Research for Evolutional Science and Technology","ror":"https://ror.org/00097mb19"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4393855615.pdf"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W36826159","https://openalex.org/W1547507450","https://openalex.org/W2018419001","https://openalex.org/W2036403858","https://openalex.org/W2069045162","https://openalex.org/W2141719776","https://openalex.org/W2160774872","https://openalex.org/W2162322364","https://openalex.org/W2169150754","https://openalex.org/W2298381282","https://openalex.org/W2746683429","https://openalex.org/W2886763336","https://openalex.org/W2962927345","https://openalex.org/W2994914294","https://openalex.org/W2995553094","https://openalex.org/W2999378407","https://openalex.org/W3036007422","https://openalex.org/W3112080169","https://openalex.org/W3114973229","https://openalex.org/W4231150350","https://openalex.org/W4291517469","https://openalex.org/W4321636543","https://openalex.org/W4321636614","https://openalex.org/W4321636779","https://openalex.org/W4384008173"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2935759653","https://openalex.org/W3105167352","https://openalex.org/W54078636","https://openalex.org/W2954470139","https://openalex.org/W1501425562","https://openalex.org/W2902782467","https://openalex.org/W3084825885"],"abstract_inverted_index":{"Hierarchical":[0],"low-rank":[1],"approximation":[2],"of":[3,10,25,70,75,106],"dense":[4,93],"matrices":[5,28,94],"can":[6,39,95],"reduce":[7],"the":[8,22,42,51,68,103,113,120],"complexity":[9],"their":[11,63],"factorization":[12,54],"from":[13],"[Formula:":[14,18,114],"see":[15,19,115],"text]":[16],"to":[17,32,81],"text].":[20],"However,":[21],"complex":[23],"structure":[24],"such":[26],"hierarchical":[27],"makes":[29,78],"them":[30],"difficult":[31],"parallelize.":[33],"The":[34,48,73],"block":[35],"size":[36],"and":[37],"ranks":[38],"vary":[40],"between":[41,50],"sub-blocks,":[43],"which":[44,118],"creates":[45],"load":[46,66],"imbalance.":[47],"dependency":[49,121],"sub-blocks":[52,60],"during":[53],"results":[55],"in":[56],"serialization.":[57],"Since":[58],"many":[59],"are":[61],"low-rank,":[62],"small":[64],"computational":[65],"exposes":[67],"overhead":[69],"runtime":[71],"systems.":[72],"combination":[74],"these":[76,83],"factors":[77],"it":[79],"challenging":[80],"implement":[82],"methods":[84],"on":[85,122],"GPUs.":[86,107],"In":[87],"this":[88],"work,":[89],"we":[90],"show":[91],"that":[92],"be":[96],"factorized":[97],"with":[98],"linear":[99],"complexity,":[100],"while":[101],"extracting":[102],"potential":[104],"parallelism":[105],"This":[108],"is":[109],"made":[110],"possible":[111],"through":[112],"text]-ULV":[116],"factorization,":[117],"removes":[119],"trailing":[123],"sub-matrices.":[124]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2024-04-04T00:00:00"}
