{"id":"https://openalex.org/W4318540786","doi":"https://doi.org/10.1145/3575693.3575706","title":"Spada: Accelerating Sparse Matrix Multiplication with Adaptive Dataflow","display_name":"Spada: Accelerating Sparse Matrix Multiplication with Adaptive Dataflow","publication_year":2023,"publication_date":"2023-01-27","ids":{"openalex":"https://openalex.org/W4318540786","doi":"https://doi.org/10.1145/3575693.3575706"},"language":"en","primary_location":{"id":"doi:10.1145/3575693.3575706","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3575693.3575706","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3575693.3575706","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 2","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3575693.3575706","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041436760","display_name":"Zhiyao Li","orcid":"https://orcid.org/0000-0001-5751-7607"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyao Li","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085926712","display_name":"Jiaxiang Li","orcid":"https://orcid.org/0000-0003-0478-1409"},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiaxiang Li","raw_affiliation_strings":["Northwestern University, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern University, USA","institution_ids":["https://openalex.org/I111979921"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001410614","display_name":"Taijie Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Taijie Chen","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068606980","display_name":"Dimin Niu","orcid":"https://orcid.org/0000-0001-8440-3875"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dimin Niu","raw_affiliation_strings":["Alibaba DAMO Academy, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba DAMO Academy, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046896624","display_name":"Hongzhong Zheng","orcid":"https://orcid.org/0000-0001-7696-9799"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongzhong Zheng","raw_affiliation_strings":["Alibaba DAMO Academy, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba DAMO Academy, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100385336","display_name":"Yuan Xie","orcid":"https://orcid.org/0000-0003-2093-1788"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Xie","raw_affiliation_strings":["Alibaba DAMO Academy, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Alibaba DAMO Academy, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026297396","display_name":"Mingyu Gao","orcid":"https://orcid.org/0000-0001-8433-7281"},"institutions":[{"id":"https://openalex.org/I4210122302","display_name":"ShangHai JiAi Genetics & IVF Institute","ror":"https://ror.org/02rgbry52","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210122302"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingyu Gao","raw_affiliation_strings":["Tsinghua University, China / Shanghai Qi Zhi Institute, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua University, China / Shanghai Qi Zhi Institute, China","institution_ids":["https://openalex.org/I4210122302","https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":13.6357,"has_fulltext":true,"cited_by_count":51,"citation_normalized_percentile":{"value":0.99531048,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"747","last_page":"761"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.9692604541778564},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8105074167251587},{"id":"https://openalex.org/keywords/dataflow-architecture","display_name":"Dataflow architecture","score":0.6539202928543091},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6425071954727173},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.6127284169197083},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5576942563056946},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.5305013656616211},{"id":"https://openalex.org/keywords/reconfigurability","display_name":"Reconfigurability","score":0.4567294418811798},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.4120437502861023},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.32495275139808655}],"concepts":[{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.9692604541778564},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8105074167251587},{"id":"https://openalex.org/C176727019","wikidata":"https://www.wikidata.org/wiki/Q1172415","display_name":"Dataflow architecture","level":3,"score":0.6539202928543091},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6425071954727173},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.6127284169197083},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5576942563056946},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.5305013656616211},{"id":"https://openalex.org/C2780149590","wikidata":"https://www.wikidata.org/wiki/Q7302742","display_name":"Reconfigurability","level":2,"score":0.4567294418811798},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.4120437502861023},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32495275139808655},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3575693.3575706","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3575693.3575706","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3575693.3575706","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 2","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-153525","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-153525","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":{"id":"doi:10.1145/3575693.3575706","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3575693.3575706","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3575693.3575706","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 2","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.4399999976158142}],"awards":[{"id":"https://openalex.org/G6501120897","display_name":"\u5927\u5bb9\u91cf\u4e0e\u9ad8\u5e76\u884c\u7684\u53ef\u6269\u5c55\u901a\u7528\u8fd1\u6570\u636e\u5904\u7406\u67b6\u6784\u7814\u7a76","funder_award_id":"62072262","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4318540786.pdf","grobid_xml":"https://content.openalex.org/works/W4318540786.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W1582397847","https://openalex.org/W1992432622","https://openalex.org/W1994687200","https://openalex.org/W2003458338","https://openalex.org/W2053999255","https://openalex.org/W2079288776","https://openalex.org/W2095249664","https://openalex.org/W2096169320","https://openalex.org/W2194775991","https://openalex.org/W2442974303","https://openalex.org/W2516141709","https://openalex.org/W2605347906","https://openalex.org/W2606722458","https://openalex.org/W2612076670","https://openalex.org/W2612387305","https://openalex.org/W2625457103","https://openalex.org/W2794952988","https://openalex.org/W2798724095","https://openalex.org/W2895531329","https://openalex.org/W2904902077","https://openalex.org/W2935331687","https://openalex.org/W2940862705","https://openalex.org/W2952598959","https://openalex.org/W2963367920","https://openalex.org/W2964233199","https://openalex.org/W2979310060","https://openalex.org/W2980186997","https://openalex.org/W2987129023","https://openalex.org/W3008725350","https://openalex.org/W3016542674","https://openalex.org/W3016832937","https://openalex.org/W3091920657","https://openalex.org/W3103168911","https://openalex.org/W3155922894","https://openalex.org/W4240168186","https://openalex.org/W4247198796","https://openalex.org/W4288083528"],"related_works":["https://openalex.org/W2564598376","https://openalex.org/W1484403103","https://openalex.org/W2584408851","https://openalex.org/W2115158825","https://openalex.org/W2101960124","https://openalex.org/W4377693460","https://openalex.org/W2033683327","https://openalex.org/W2783505431","https://openalex.org/W2521947294","https://openalex.org/W4236419692"],"abstract_inverted_index":{"Sparse":[0],"matrix-matrix":[1],"multiplication":[2],"(SpGEMM)":[3],"is":[4,58,184],"widely":[5,74],"used":[6],"in":[7,174],"many":[8],"scientific":[9],"and":[10,23,29,65,121,138,141,157,197,208,224],"deep":[11],"learning":[12],"applications.":[13],"The":[14],"highly":[15],"irregular":[16],"structures":[17],"of":[18,35,46,86,170,202,221],"SpGEMM":[19,40,76,91,195],"limit":[20],"its":[21],"performance":[22,71,200],"efficiency":[24],"on":[25,166],"conventional":[26],"computation":[27],"platforms,":[28],"thus":[30],"motivate":[31],"a":[32,84,103,149,218],"large":[33],"body":[34],"specialized":[36],"hardware":[37,128],"designs.":[38],"Existing":[39],"accelerators":[41,92],"only":[42,59],"support":[43],"specific":[44],"types":[45],"rigid":[47],"execution":[48],"dataflow":[49,57,106,133,161,209],"such":[50],"as":[51],"inner/output-product":[52],"or":[53,188],"row-based":[54],"schemes.":[55],"Each":[56],"optimized":[60,160],"for":[61,90],"certain":[62],"sparse":[63,98,155,171,222],"patterns":[64],"fails":[66],"to":[67,72,93,96,112,115,152,163,186],"generalize":[68],"with":[69,135],"robust":[70],"the":[73,118,154,159,167,190,199,203],"diverse":[75],"workloads":[77],"across":[78,217],"various":[79,97],"domains.":[80],"We":[81],"propose":[82],"Spada,":[83],"combination":[85],"three":[87,193],"novel":[88],"techniques":[89],"efficiently":[94,130],"adapt":[95],"patterns.":[99],"First,":[100],"we":[101,147],"describe":[102],"window-based":[104],"adaptive":[105],"that":[107,182],"can":[108],"be":[109],"flexibly":[110],"adapted":[111],"different":[113,123],"modes":[114],"best":[116,191],"match":[117,187],"data":[119,206],"distributions":[120],"realize":[122],"reuse":[124],"benefits.":[125],"Then,":[126],"our":[127],"architecture":[129],"supports":[131],"this":[132],"template,":[134],"flexible,":[136],"fast,":[137],"low-cost":[139],"reconfigurability":[140],"effective":[142],"load":[143],"balancing":[144],"features.":[145],"Finally,":[146],"use":[148],"profiling-guided":[150],"approach":[151],"detect":[153],"pattern":[156,172],"determine":[158],"mode":[162],"use,":[164],"based":[165],"key":[168],"observations":[169],"similarity":[173],"nearby":[175],"matrix":[176],"regions.":[177],"Our":[178],"evaluation":[179],"results":[180],"demonstrate":[181],"Spada":[183],"able":[185],"exceed":[189],"among":[192],"state-of-the-art":[194],"accelerators,":[196],"avoid":[198],"degradation":[201],"others":[204],"if":[205],"distribution":[207],"mismatch.":[210],"It":[211],"achieves":[212],"an":[213],"average":[214],"1.44\u00d7":[215],"speedup":[216],"wide":[219],"range":[220],"matrices":[223],"compressed":[225],"neural":[226],"network":[227],"models.":[228]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":26},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":4}],"updated_date":"2026-07-02T09:51:11.867554","created_date":"2025-10-10T00:00:00"}
