{"id":"https://openalex.org/W3131379896","doi":"https://doi.org/10.1145/3437801.3441581","title":"Sparta","display_name":"Sparta","publication_year":2021,"publication_date":"2021-02-17","ids":{"openalex":"https://openalex.org/W3131379896","doi":"https://doi.org/10.1145/3437801.3441581","mag":"3131379896"},"language":"en","primary_location":{"id":"doi:10.1145/3437801.3441581","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3437801.3441581","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 26th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100617624","display_name":"Jiawen Liu","orcid":"https://orcid.org/0000-0001-8673-1514"},"institutions":[{"id":"https://openalex.org/I2803209242","display_name":"University of California System","ror":"https://ror.org/00pjdza24","country_code":"US","type":"education","lineage":["https://openalex.org/I2803209242"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jiawen Liu","raw_affiliation_strings":["University of California"],"affiliations":[{"raw_affiliation_string":"University of California","institution_ids":["https://openalex.org/I2803209242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056482728","display_name":"Jie Ren","orcid":"https://orcid.org/0000-0001-5541-433X"},"institutions":[{"id":"https://openalex.org/I2803209242","display_name":"University of California System","ror":"https://ror.org/00pjdza24","country_code":"US","type":"education","lineage":["https://openalex.org/I2803209242"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jie Ren","raw_affiliation_strings":["University of California"],"affiliations":[{"raw_affiliation_string":"University of California","institution_ids":["https://openalex.org/I2803209242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075909942","display_name":"Roberto Gioiosa","orcid":"https://orcid.org/0000-0001-9430-2656"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Roberto Gioiosa","raw_affiliation_strings":["Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100407387","display_name":"Dong Li","orcid":"https://orcid.org/0000-0001-9336-0694"},"institutions":[{"id":"https://openalex.org/I2803209242","display_name":"University of California System","ror":"https://ror.org/00pjdza24","country_code":"US","type":"education","lineage":["https://openalex.org/I2803209242"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dong Li","raw_affiliation_strings":["University of California"],"affiliations":[{"raw_affiliation_string":"University of California","institution_ids":["https://openalex.org/I2803209242"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100454305","display_name":"Jiajia Li","orcid":"https://orcid.org/0000-0003-1270-4147"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiajia Li","raw_affiliation_strings":["Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100617624"],"corresponding_institution_ids":["https://openalex.org/I2803209242"],"apc_list":null,"apc_paid":null,"fwci":4.1451,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.94446198,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"318","last_page":"333"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.973800003528595,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.771075963973999},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.688668429851532},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.658771276473999},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5501705408096313},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.5334503650665283},{"id":"https://openalex.org/keywords/dram","display_name":"Dram","score":0.5291455388069153},{"id":"https://openalex.org/keywords/sparse-approximation","display_name":"Sparse approximation","score":0.4913696348667145},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.47895553708076477},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.4749598503112793},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.429138720035553},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.4224259853363037},{"id":"https://openalex.org/keywords/accumulator","display_name":"Accumulator (cryptography)","score":0.4167688488960266},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.41394302248954773},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4069211483001709},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3637150824069977},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.20431196689605713},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1434800922870636},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.14000648260116577}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.771075963973999},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.688668429851532},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.658771276473999},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5501705408096313},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.5334503650665283},{"id":"https://openalex.org/C7366592","wikidata":"https://www.wikidata.org/wiki/Q1255620","display_name":"Dram","level":2,"score":0.5291455388069153},{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.4913696348667145},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.47895553708076477},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.4749598503112793},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.429138720035553},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.4224259853363037},{"id":"https://openalex.org/C2078106","wikidata":"https://www.wikidata.org/wiki/Q14906620","display_name":"Accumulator (cryptography)","level":2,"score":0.4167688488960266},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.41394302248954773},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4069211483001709},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3637150824069977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.20431196689605713},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1434800922870636},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.14000648260116577},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3437801.3441581","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3437801.3441581","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 26th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4099999964237213,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W1493774699","https://openalex.org/W1506547947","https://openalex.org/W1511885491","https://openalex.org/W1839329870","https://openalex.org/W1991740738","https://openalex.org/W1993079359","https://openalex.org/W2006973305","https://openalex.org/W2007259720","https://openalex.org/W2047547750","https://openalex.org/W2054658678","https://openalex.org/W2061014792","https://openalex.org/W2089196182","https://openalex.org/W2093135480","https://openalex.org/W2095249664","https://openalex.org/W2104305170","https://openalex.org/W2127226421","https://openalex.org/W2139397769","https://openalex.org/W2143119605","https://openalex.org/W2155694951","https://openalex.org/W2234552091","https://openalex.org/W2235832317","https://openalex.org/W2292369231","https://openalex.org/W2340522713","https://openalex.org/W2410461480","https://openalex.org/W2411765360","https://openalex.org/W2471966094","https://openalex.org/W2481767403","https://openalex.org/W2523003201","https://openalex.org/W2541878878","https://openalex.org/W2557840067","https://openalex.org/W2560878429","https://openalex.org/W2582107166","https://openalex.org/W2590246587","https://openalex.org/W2604595776","https://openalex.org/W2604652149","https://openalex.org/W2616934551","https://openalex.org/W2620550288","https://openalex.org/W2727953781","https://openalex.org/W2731053425","https://openalex.org/W2741701794","https://openalex.org/W2751658790","https://openalex.org/W2788854599","https://openalex.org/W2891431244","https://openalex.org/W2902783593","https://openalex.org/W2903504144","https://openalex.org/W2904295992","https://openalex.org/W2914097545","https://openalex.org/W2915032613","https://openalex.org/W2934584470","https://openalex.org/W2951178714","https://openalex.org/W2964051974","https://openalex.org/W2964336816","https://openalex.org/W2970435804","https://openalex.org/W2971508019","https://openalex.org/W2985039650","https://openalex.org/W2986686333","https://openalex.org/W3099762987","https://openalex.org/W3101321165","https://openalex.org/W3103902563","https://openalex.org/W3105364241","https://openalex.org/W3105937213","https://openalex.org/W3131683382","https://openalex.org/W3157864729","https://openalex.org/W4237249260","https://openalex.org/W4248445937","https://openalex.org/W6729203000","https://openalex.org/W6785921489","https://openalex.org/W6917257265"],"related_works":["https://openalex.org/W2293771254","https://openalex.org/W4221142455","https://openalex.org/W3121828480","https://openalex.org/W2039875226","https://openalex.org/W2914631005","https://openalex.org/W2032786851","https://openalex.org/W2952630098","https://openalex.org/W3132517792","https://openalex.org/W4285148873","https://openalex.org/W2062240003"],"abstract_inverted_index":{"Sparse":[0],"tensor":[1,13,103],"contractions":[2],"appear":[3],"commonly":[4],"in":[5],"many":[6],"applications.":[7],"Efficiently":[8],"computing":[9],"a":[10,137,143],"two":[11],"sparse":[12,25,102,106],"product":[14],"is":[15],"challenging:":[16],"It":[17],"not":[18],"only":[19],"inherits":[20],"the":[21,62,77,100,123],"challenges":[22,43],"from":[23],"common":[24],"matrix-matrix":[26],"multiplication":[27],"(SpGEMM),":[28],"i.e.,":[29],"indirect":[30],"memory":[31,113,125],"access":[32],"and":[33,54,57,79,83,112,128,148,159],"unknown":[34],"output":[35,58],"size":[36],"before":[37],"computation,":[38],"but":[39],"also":[40],"raises":[41],"new":[42],"because":[44],"of":[45,48],"high":[46],"dimensionality":[47],"tensors,":[49],"expensive":[50],"multi-dimensional":[51],"index":[52],"search,":[53],"massive":[55],"intermediate":[56],"data.":[59],"To":[60],"address":[61],"above":[63],"challenges,":[64],"we":[65,90],"introduce":[66],"three":[67],"optimization":[68],"techniques":[69],"by":[70,150],"using":[71],"multi-dimensional,":[72],"efficient":[73],"hashtable":[74],"representation":[75],"for":[76],"accumulator":[78],"larger":[80],"input":[81],"tensor,":[82],"all-stage":[84],"parallelization.":[85],"Evaluating":[86],"with":[87,105,126],"15":[88],"datasets,":[89],"show":[91],"that":[92],"Sparta":[93,117],"brings":[94,118],"28":[95],"--":[96],"576\u00d7":[97],"speedup":[98],"over":[99,136],"traditional":[101],"contraction":[104],"accumulator.":[107],"With":[108],"our":[109],"proposed":[110],"algorithm-":[111],"heterogeneity-aware":[114],"data":[115,140,145],"management,":[116],"extra":[119],"performance":[120],"improvement":[121],"on":[122],"heterogeneous":[124],"DRAM":[127],"Intel":[129],"Optane":[130],"DC":[131],"Persistent":[132],"Memory":[133],"Module":[134],"(PMM)":[135],"state-of-the-art":[138],"software-based":[139],"management":[141,146],"solution,":[142,147],"hardware-based":[144],"PMM-only":[149],"30.7%":[151],"(up":[152,156,161],"to":[153,157,162],"98.5%),":[154],"10.7%":[155],"28.3%)":[158],"17%":[160],"65.1%)":[163],"respectively.":[164]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":4}],"updated_date":"2026-02-25T08:12:03.925757","created_date":"2021-03-01T00:00:00"}
