{"id":"https://openalex.org/W4382048437","doi":"https://doi.org/10.1145/3592979.3593413","title":"Mixed-Precision Random Projection for RandNLA on Tensor Cores","display_name":"Mixed-Precision Random Projection for RandNLA on Tensor Cores","publication_year":2023,"publication_date":"2023-06-26","ids":{"openalex":"https://openalex.org/W4382048437","doi":"https://doi.org/10.1145/3592979.3593413"},"language":"en","primary_location":{"id":"doi:10.1145/3592979.3593413","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3592979.3593413","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Platform for Advanced Scientific Computing Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071124999","display_name":"Hiroyuki Ootomo","orcid":"https://orcid.org/0000-0002-9522-3789"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Hiroyuki Ootomo","raw_affiliation_strings":["Tokyo Institute of Technology, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024747717","display_name":"Rio Yokota","orcid":"https://orcid.org/0000-0001-7573-7873"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Rio Yokota","raw_affiliation_strings":["Tokyo Institute of Technology, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5071124999"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":0.6319,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.6109134,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/random-projection","display_name":"Random projection","score":0.8401645421981812},{"id":"https://openalex.org/keywords/projection","display_name":"Projection (relational algebra)","score":0.6310893297195435},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.6231475472450256},{"id":"https://openalex.org/keywords/singular-value-decomposition","display_name":"Singular value decomposition","score":0.5823850631713867},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.5699975490570068},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5621718168258667},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5496373176574707},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.5320706367492676},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5129873156547546},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4907287359237671},{"id":"https://openalex.org/keywords/multiplication","display_name":"Multiplication (music)","score":0.488810271024704},{"id":"https://openalex.org/keywords/random-matrix","display_name":"Random matrix","score":0.46589505672454834},{"id":"https://openalex.org/keywords/numerical-linear-algebra","display_name":"Numerical linear algebra","score":0.46446532011032104},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.41788822412490845},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.32827451825141907},{"id":"https://openalex.org/keywords/linear-system","display_name":"Linear system","score":0.2933995723724365},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.17744600772857666}],"concepts":[{"id":"https://openalex.org/C2777036070","wikidata":"https://www.wikidata.org/wiki/Q18393452","display_name":"Random projection","level":2,"score":0.8401645421981812},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.6310893297195435},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.6231475472450256},{"id":"https://openalex.org/C22789450","wikidata":"https://www.wikidata.org/wiki/Q420904","display_name":"Singular value decomposition","level":2,"score":0.5823850631713867},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.5699975490570068},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5621718168258667},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5496373176574707},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.5320706367492676},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5129873156547546},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4907287359237671},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.488810271024704},{"id":"https://openalex.org/C64812099","wikidata":"https://www.wikidata.org/wiki/Q176604","display_name":"Random matrix","level":3,"score":0.46589505672454834},{"id":"https://openalex.org/C163834973","wikidata":"https://www.wikidata.org/wiki/Q2004891","display_name":"Numerical linear algebra","level":3,"score":0.46446532011032104},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.41788822412490845},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.32827451825141907},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.2933995723724365},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.17744600772857666},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3592979.3593413","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3592979.3593413","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Platform for Advanced Scientific Computing Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1069223013","display_name":null,"funder_award_id":"JSPS KAKENHI","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G1694571055","display_name":null,"funder_award_id":"JP21H03447","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G193038087","display_name":null,"funder_award_id":"JST CREST","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G2061319648","display_name":null,"funder_award_id":"JP22H0359","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G2792802287","display_name":null,"funder_award_id":"KAKENHI","funder_id":"https://openalex.org/F4320338075","funder_display_name":"Core Research for Evolutional Science and Technology"},{"id":"https://openalex.org/G3282004645","display_name":null,"funder_award_id":"JPMJCR","funder_id":"https://openalex.org/F4320338075","funder_display_name":"Core Research for Evolutional Science and Technology"},{"id":"https://openalex.org/G3459562248","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3938381110","display_name":"\u5341\u548c\u7530\u30ab\u30eb\u30c7\u30e9\u5674\u51fa\u7269\u306e\u706b\u5c71\u5c64\u5e8f\u5b66\u7684\u7814\u7a76","funder_award_id":"23005","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4227499671","display_name":null,"funder_award_id":"KAKENHI Grant","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4636223006","display_name":null,"funder_award_id":"JSPS KAK","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5778814166","display_name":null,"funder_award_id":"K2062","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5786340949","display_name":null,"funder_award_id":"KAKENHI Grant Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5938650130","display_name":null,"funder_award_id":"21H03447","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G6317729023","display_name":null,"funder_award_id":"22H03598","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G6718509927","display_name":null,"funder_award_id":"CREST","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G6723945271","display_name":"\u76e3\u67fb\u5f79\u304a\u3088\u3073\u4f1a\u8a08\u58eb\u306e\u76e3\u67fb\u5236\u5ea6\u306b\u95a2\u3059\u308b\u7814\u7a76","funder_award_id":"30009","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G720495953","display_name":"Application of Unconventional Linear Algebra Techniques to Continuous Learning in Supergiant Neural Networks","funder_award_id":"20K20624","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7752643416","display_name":null,"funder_award_id":"Japan","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7840269759","display_name":null,"funder_award_id":"JP20K","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8430481527","display_name":null,"funder_award_id":"Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"},{"id":"https://openalex.org/F4320338075","display_name":"Core Research for Evolutional Science and Technology","ror":"https://ror.org/00097mb19"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1583837637","https://openalex.org/W1933407002","https://openalex.org/W1964542748","https://openalex.org/W2004026774","https://openalex.org/W2013912476","https://openalex.org/W2033244207","https://openalex.org/W2037757210","https://openalex.org/W2041836310","https://openalex.org/W2073327480","https://openalex.org/W2090898720","https://openalex.org/W2107599050","https://openalex.org/W2110784778","https://openalex.org/W2117756735","https://openalex.org/W2119233169","https://openalex.org/W2120350343","https://openalex.org/W2121153407","https://openalex.org/W2394933259","https://openalex.org/W2471210720","https://openalex.org/W2491755644","https://openalex.org/W2606722458","https://openalex.org/W2609644570","https://openalex.org/W2747122024","https://openalex.org/W2771019312","https://openalex.org/W2791673912","https://openalex.org/W2792300954","https://openalex.org/W2963718636","https://openalex.org/W2981825520","https://openalex.org/W2990138404","https://openalex.org/W3034986667","https://openalex.org/W3125352309","https://openalex.org/W3127717271","https://openalex.org/W3195265091","https://openalex.org/W3197930963","https://openalex.org/W3201817523","https://openalex.org/W4221160294","https://openalex.org/W4221161761","https://openalex.org/W4280494023","https://openalex.org/W4280590264","https://openalex.org/W4281986533","https://openalex.org/W4319917399","https://openalex.org/W6676220612","https://openalex.org/W6755869844"],"related_works":["https://openalex.org/W2617690415","https://openalex.org/W2962882058","https://openalex.org/W4286233507","https://openalex.org/W4310489806","https://openalex.org/W3047787696","https://openalex.org/W2045648570","https://openalex.org/W2181927120","https://openalex.org/W2964247956","https://openalex.org/W4364387326","https://openalex.org/W4382048437"],"abstract_inverted_index":{"Random":[0,160],"projection":[1,41,62,98,161],"can":[2,152],"reduce":[3,43],"the":[4,44,57,60,111,114,143],"dimension":[5],"of":[6,31,47,50,59],"data":[7,32],"while":[8,172],"capturing":[9],"its":[10,68,89],"structure":[11],"and":[12,22,52,120,129,135,159],"is":[13,63,72,146],"a":[14,28,64,79,94,122],"fundamental":[15],"tool":[16],"for":[17,87,106],"machine":[18],"learning,":[19],"signal":[20],"processing,":[21],"information":[23],"retrieval,":[24],"which":[25],"deal":[26],"with":[27],"large":[29],"amount":[30],"today.":[33],"RandNLA":[34,80],"(Randomized":[35],"Numerical":[36],"Linear":[37],"Algebra)":[38],"leverages":[39],"random":[40,61,97,115,144],"to":[42],"computational":[45,70,90],"complexity":[46,71],"low-rank":[48],"decomposition":[49],"tensors":[51],"solve":[53],"least-square":[54],"problems.":[55],"While":[56],"computation":[58],"simple":[65],"matrix":[66,116,125,145],"multiplication,":[67],"asymptotic":[69],"typically":[73],"larger":[74],"than":[75,168],"other":[76],"operations":[77],"in":[78,148],"algorithm.":[81],"Therefore,":[82],"various":[83],"studies":[84],"propose":[85,93],"methods":[86],"reducing":[88],"complexity.":[91],"We":[92,109],"fast":[95],"mixed-precision":[96],"method":[99,151],"on":[100,139],"NVIDIA":[101],"GPUs":[102],"using":[103],"Tensor":[104,140],"Cores":[105],"single-precision":[107,170],"tensors.":[108],"exploit":[110],"fact":[112],"that":[113],"requires":[117],"less":[118],"precision,":[119],"develop":[121],"highly":[123],"optimized":[124],"multiplication":[126],"between":[127],"FP32":[128],"FP16":[130],"matrices":[131],"-":[132,138],"SHGEMM":[133],"(Single":[134],"Half":[136],"GEMM)":[137],"Cores,":[141],"where":[142],"stored":[147],"FP16.":[149],"Our":[150],"compute":[153],"Randomized":[154],"SVD":[155,164],"1.28":[156],"times":[157,166],"faster":[158,167],"high":[162],"order":[163],"1.75":[165],"baseline":[169],"implementations":[171],"maintaining":[173],"accuracy.":[174]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
