{"id":"https://openalex.org/W2891832717","doi":"https://doi.org/10.1145/3205289.3205313","title":"Towards Efficient SpMV on Sunway Manycore Architectures","display_name":"Towards Efficient SpMV on Sunway Manycore Architectures","publication_year":2018,"publication_date":"2018-06-12","ids":{"openalex":"https://openalex.org/W2891832717","doi":"https://doi.org/10.1145/3205289.3205313","mag":"2891832717"},"language":"en","primary_location":{"id":"doi:10.1145/3205289.3205313","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3205289.3205313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 International Conference on Supercomputing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101869479","display_name":"Changxi Liu","orcid":"https://orcid.org/0000-0001-9240-5926"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Changxi Liu","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107771061","display_name":"Biwei Xie","orcid":"https://orcid.org/0000-0003-4045-6806"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Biwei Xie","raw_affiliation_strings":["State Key Laboratory of Computer Architecture, Institute of Computing Technology, Chinese Academy of Sciences, University of Chinese, Academy of Sciences, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Computer Architecture, Institute of Computing Technology, Chinese Academy of Sciences, University of Chinese, Academy of Sciences, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100352268","display_name":"Xin Liu","orcid":"https://orcid.org/0000-0002-7870-6535"},"institutions":[{"id":"https://openalex.org/I16285277","display_name":"William & Mary","ror":"https://ror.org/03hsf0573","country_code":"US","type":"education","lineage":["https://openalex.org/I16285277"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xin Liu","raw_affiliation_strings":["Department of Computer Science, College of William and Mary, USA","National Research Centre of Parallel Computer Engineering and Technology, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, College of William and Mary, USA","institution_ids":["https://openalex.org/I16285277"]},{"raw_affiliation_string":"National Research Centre of Parallel Computer Engineering and Technology, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091437474","display_name":"Wei Xue","orcid":"https://orcid.org/0000-0001-9740-6581"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Xue","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018705589","display_name":"Hailong Yang","orcid":"https://orcid.org/0000-0003-1101-7927"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hailong Yang","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100331713","display_name":"Xu Liu","orcid":"https://orcid.org/0000-0002-8984-5485"},"institutions":[{"id":"https://openalex.org/I16285277","display_name":"William & Mary","ror":"https://ror.org/03hsf0573","country_code":"US","type":"education","lineage":["https://openalex.org/I16285277"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xu Liu","raw_affiliation_strings":["Department of Computer Science, College of William and Mary, USA","National Research Centre of Parallel Computer Engineering and Technology, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, College of William and Mary, USA","institution_ids":["https://openalex.org/I16285277"]},{"raw_affiliation_string":"National Research Centre of Parallel Computer Engineering and Technology, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101869479"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":8.079,"has_fulltext":false,"cited_by_count":51,"citation_normalized_percentile":{"value":0.9811782,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"363","last_page":"373"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8489981293678284},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7870535850524902},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.5174041986465454},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5123401880264282},{"id":"https://openalex.org/keywords/porting","display_name":"Porting","score":0.49121493101119995},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.4456588923931122},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.4111907482147217},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.1189764142036438},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.0948876142501831},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08406206965446472}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8489981293678284},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7870535850524902},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.5174041986465454},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5123401880264282},{"id":"https://openalex.org/C106251023","wikidata":"https://www.wikidata.org/wiki/Q851989","display_name":"Porting","level":3,"score":0.49121493101119995},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.4456588923931122},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.4111907482147217},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.1189764142036438},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0948876142501831},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08406206965446472},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3205289.3205313","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3205289.3205313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 International Conference on Supercomputing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.5299999713897705,"id":"https://metadata.un.org/sdg/9"}],"awards":[{"id":"https://openalex.org/G4755521671","display_name":null,"funder_award_id":"61502019,91530323,41776010","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1506342804","https://openalex.org/W1975116854","https://openalex.org/W1981902599","https://openalex.org/W1987840949","https://openalex.org/W1990832096","https://openalex.org/W1993704253","https://openalex.org/W2003117296","https://openalex.org/W2009654791","https://openalex.org/W2023930909","https://openalex.org/W2035080386","https://openalex.org/W2088866486","https://openalex.org/W2091883426","https://openalex.org/W2095292158","https://openalex.org/W2115052535","https://openalex.org/W2126004407","https://openalex.org/W2128539477","https://openalex.org/W2128853364","https://openalex.org/W2136324023","https://openalex.org/W2162283062","https://openalex.org/W2415007423","https://openalex.org/W2475126267","https://openalex.org/W2559809597","https://openalex.org/W2561247022","https://openalex.org/W2728256789","https://openalex.org/W2730450744","https://openalex.org/W2730740223","https://openalex.org/W2767373187","https://openalex.org/W2788264912","https://openalex.org/W2789228469","https://openalex.org/W2791012218","https://openalex.org/W3125710003","https://openalex.org/W4238995617","https://openalex.org/W4243261006","https://openalex.org/W4248980851"],"related_works":["https://openalex.org/W2356602486","https://openalex.org/W2351992668","https://openalex.org/W2324828474","https://openalex.org/W2374315191","https://openalex.org/W2391207559","https://openalex.org/W2384715785","https://openalex.org/W2349624418","https://openalex.org/W2064459023","https://openalex.org/W2384611437","https://openalex.org/W2886568922"],"abstract_inverted_index":{"Sparse":[0],"Matrix-Vector":[1],"Multiplication":[2],"(SpMV)":[3],"is":[4,25,143],"an":[5],"essential":[6],"computation":[7,124],"kernel":[8],"for":[9,98],"many":[10,57],"data-analytic":[11],"workloads":[12],"running":[13],"in":[14,23,108,120],"both":[15,75],"supercomputers":[16],"and":[17,46,78,84,96,114,125,150],"data":[18],"centers.":[19],"The":[20],"intrinsic":[21],"irregularity":[22],"SpMV":[24,49,148,162],"challenging":[26],"to":[27,34,81,136,146,176],"achieve":[28],"high":[29],"performance,":[30],"especially":[31],"when":[32],"porting":[33],"new":[35],"architectures.":[36],"In":[37],"this":[38],"paper,":[39],"we":[40,66,89,105,129,154],"present":[41],"our":[42,157,172],"work":[43],"on":[44,51,74,167,179],"designing":[45],"implementing":[47],"efficient":[48],"algorithms":[50],"Sunway,":[52],"a":[53,69,109,121,160],"novel":[54],"architecture":[55],"with":[56],"unique":[58],"features.":[59],"To":[60],"fully":[61],"exploit":[62],"the":[63,102,132,139],"Sunway":[64,110],"architecture,":[65],"have":[67,130,155],"designed":[68],"dual-side":[70],"multi-level":[71],"partition":[72,90,106],"mechanism":[73],"sparse":[76,91],"matrices":[77,92],"hardware":[79],"resources":[80],"improve":[82,138],"locality":[83],"parallelism.":[85],"On":[86,101],"one":[87],"hand,":[88,104],"into":[93,112],"blocks,":[94],"tiles,":[95],"slices":[97],"different":[99,147],"granularities.":[100],"other":[103],"cores":[107,119],"processor":[111],"fleets,":[113],"further":[115,137],"dedicate":[116],"part":[117],"of":[118],"fleet":[122],"as":[123],"I/O":[126],"cores.":[127],"Moreover,":[128],"optimized":[131],"communication":[133],"between":[134],"partitions":[135],"performance.":[140],"Our":[141],"scheme":[142],"generally":[144],"applicable":[145],"formats":[149],"implementations.":[151],"For":[152],"evaluation,":[153],"applied":[156],"techniques":[158],"atop":[159],"popular":[161],"format,":[163],"CSR.":[164],"Experimental":[165],"results":[166],"18":[168],"datasets":[169],"show":[170],"that":[171],"optimization":[173],"yields":[174],"up":[175],"15.5x":[177],"(12.3x":[178],"average)":[180],"speedups.":[181]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":15},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
