{"id":"https://openalex.org/W3082025233","doi":"https://doi.org/10.1587/transinf.2019edp7265","title":"Block Randomized Singular Value Decomposition on GPUs","display_name":"Block Randomized Singular Value Decomposition on GPUs","publication_year":2020,"publication_date":"2020-08-31","ids":{"openalex":"https://openalex.org/W3082025233","doi":"https://doi.org/10.1587/transinf.2019edp7265","mag":"3082025233"},"language":"en","primary_location":{"id":"doi:10.1587/transinf.2019edp7265","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2019edp7265","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E103.D/9/E103.D_2019EDP7265/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.jstage.jst.go.jp/article/transinf/E103.D/9/E103.D_2019EDP7265/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028535856","display_name":"Yuechao Lu","orcid":"https://orcid.org/0000-0002-8808-1559"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yuechao LU","raw_affiliation_strings":["Graduate School of Information Science and Technology, Osaka University"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, Osaka University","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033986386","display_name":"Yasuyuki Matsushita","orcid":"https://orcid.org/0000-0002-1935-4752"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yasuyuki MATSUSHITA","raw_affiliation_strings":["Graduate School of Information Science and Technology, Osaka University"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, Osaka University","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090008684","display_name":"Fumihiko Ino","orcid":"https://orcid.org/0000-0002-5757-7631"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Fumihiko INO","raw_affiliation_strings":["Graduate School of Information Science and Technology, Osaka University"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, Osaka University","institution_ids":["https://openalex.org/I98285908"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5028535856"],"corresponding_institution_ids":["https://openalex.org/I98285908"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.10183109,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"E103.D","issue":"9","first_page":"1949","last_page":"1959"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/singular-value-decomposition","display_name":"Singular value decomposition","score":0.8828293681144714},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8142566680908203},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7928192615509033},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7125846147537231},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6459000706672668},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.606117844581604},{"id":"https://openalex.org/keywords/singular-value","display_name":"Singular value","score":0.5362401008605957},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5337349772453308},{"id":"https://openalex.org/keywords/linear-algebra","display_name":"Linear algebra","score":0.5179163813591003},{"id":"https://openalex.org/keywords/randomized-algorithm","display_name":"Randomized algorithm","score":0.46006929874420166},{"id":"https://openalex.org/keywords/numerical-linear-algebra","display_name":"Numerical linear algebra","score":0.4372597634792328},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3522074520587921},{"id":"https://openalex.org/keywords/linear-system","display_name":"Linear system","score":0.2626735270023346},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10958555340766907}],"concepts":[{"id":"https://openalex.org/C22789450","wikidata":"https://www.wikidata.org/wiki/Q420904","display_name":"Singular value decomposition","level":2,"score":0.8828293681144714},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8142566680908203},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7928192615509033},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7125846147537231},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6459000706672668},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.606117844581604},{"id":"https://openalex.org/C109282560","wikidata":"https://www.wikidata.org/wiki/Q4166054","display_name":"Singular value","level":3,"score":0.5362401008605957},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5337349772453308},{"id":"https://openalex.org/C139352143","wikidata":"https://www.wikidata.org/wiki/Q82571","display_name":"Linear algebra","level":2,"score":0.5179163813591003},{"id":"https://openalex.org/C128669082","wikidata":"https://www.wikidata.org/wiki/Q583461","display_name":"Randomized algorithm","level":2,"score":0.46006929874420166},{"id":"https://openalex.org/C163834973","wikidata":"https://www.wikidata.org/wiki/Q2004891","display_name":"Numerical linear algebra","level":3,"score":0.4372597634792328},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3522074520587921},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.2626735270023346},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10958555340766907},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transinf.2019edp7265","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2019edp7265","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E103.D/9/E103.D_2019EDP7265/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1587/transinf.2019edp7265","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2019edp7265","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E103.D/9/E103.D_2019EDP7265/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G12401395","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320320912","funder_display_name":"Ministry of Education, Culture, Sports, Science and Technology"},{"id":"https://openalex.org/G8044579487","display_name":null,"funder_award_id":"Japan","funder_id":"https://openalex.org/F4320320912","funder_display_name":"Ministry of Education, Culture, Sports, Science and Technology"}],"funders":[{"id":"https://openalex.org/F4320320912","display_name":"Ministry of Education, Culture, Sports, Science and Technology","ror":"https://ror.org/048rj2z13"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3082025233.pdf","grobid_xml":"https://content.openalex.org/works/W3082025233.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W1907157228","https://openalex.org/W1964122179","https://openalex.org/W1968691112","https://openalex.org/W1979750072","https://openalex.org/W1982811641","https://openalex.org/W2000274929","https://openalex.org/W2002555321","https://openalex.org/W2005423095","https://openalex.org/W2010747199","https://openalex.org/W2032039029","https://openalex.org/W2033419168","https://openalex.org/W2039472483","https://openalex.org/W2040387238","https://openalex.org/W2045390367","https://openalex.org/W2045977792","https://openalex.org/W2063186542","https://openalex.org/W2071128523","https://openalex.org/W2104373803","https://openalex.org/W2111221242","https://openalex.org/W2115934858","https://openalex.org/W2117293168","https://openalex.org/W2117756735","https://openalex.org/W2118774738","https://openalex.org/W2123921160","https://openalex.org/W2152356156","https://openalex.org/W2154202969","https://openalex.org/W2157237396","https://openalex.org/W2169150754","https://openalex.org/W2294798173","https://openalex.org/W2514696722","https://openalex.org/W2588282852","https://openalex.org/W2609553524","https://openalex.org/W2765887041","https://openalex.org/W2772646190","https://openalex.org/W2900234561","https://openalex.org/W2962717353","https://openalex.org/W3100283647","https://openalex.org/W3100417409","https://openalex.org/W3141650078","https://openalex.org/W4236558082"],"related_works":["https://openalex.org/W4319586039","https://openalex.org/W4382583540","https://openalex.org/W2147072251","https://openalex.org/W1990844505","https://openalex.org/W2148568324","https://openalex.org/W1607100495","https://openalex.org/W4386721910","https://openalex.org/W4378770618","https://openalex.org/W2558792981","https://openalex.org/W2284236008"],"abstract_inverted_index":{"Fast":[0],"computation":[1,71],"of":[2,8,107,147],"singular":[3,93],"value":[4],"decomposition":[5],"(SVD)":[6],"is":[7,61,96],"great":[9],"interest":[10],"in":[11,28,99,117,145],"various":[12],"machine":[13],"learning":[14],"tasks.":[15],"Recently,":[16],"SVD":[17,85,143],"methods":[18,144],"based":[19],"on":[20],"randomized":[21,80,84,142],"linear":[22],"algebra":[23],"have":[24,41],"shown":[25],"significant":[26],"speedup":[27],"this":[29],"regime.":[30],"For":[31],"processing":[32],"large-scale":[33,115],"data,":[34],"computing":[35,109],"systems":[36],"with":[37,90,149],"accelerators":[38],"like":[39],"GPUs":[40],"become":[42],"the":[43,51,55,70,105,130],"mainstream":[44],"approach.":[45],"In":[46],"those":[47],"systems,":[48],"access":[49],"to":[50,63,68,136],"input":[52],"data":[53,116,134],"dominates":[54],"overall":[56],"process":[57],"time;":[58],"therefore,":[59],"it":[60],"needed":[62],"design":[64],"an":[65,77],"out-of-core":[66,121],"algorithm":[67],"dispatch":[69],"into":[72],"accelerators.":[73],"This":[74],"paper":[75],"proposes":[76],"accurate":[78],"two-pass":[79],"SVD,":[81],"named":[82],"block":[83],"(BRSVD),":[86],"designed":[87],"for":[88],"matrices":[89],"a":[91,118],"slow-decay":[92],"spectrum":[94],"that":[95,126,139],"often":[97],"observed":[98],"image":[100],"data.":[101],"BRSVD":[102,127],"fully":[103],"utilizes":[104],"power":[106],"modern":[108],"system":[110],"architectures":[111],"and":[112,120],"efficiently":[113],"processes":[114],"parallel":[119],"fashion.":[122],"Our":[123],"experiments":[124],"show":[125],"effectively":[128],"moves":[129],"performance":[131],"bottleneck":[132],"from":[133],"transfer":[135],"computation,":[137],"so":[138],"outperforms":[140],"existing":[141],"terms":[146],"speed":[148],"retaining":[150],"similar":[151],"accuracy.":[152]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2025-10-10T00:00:00"}
