{"id":"https://openalex.org/W4294734199","doi":"https://doi.org/10.1145/3561652","title":"Design and Implementation for Nonblocking Execution in GraphBLAS: Tradeoffs and Performance","display_name":"Design and Implementation for Nonblocking Execution in GraphBLAS: Tradeoffs and Performance","publication_year":2022,"publication_date":"2022-09-06","ids":{"openalex":"https://openalex.org/W4294734199","doi":"https://doi.org/10.1145/3561652"},"language":"en","primary_location":{"id":"doi:10.1145/3561652","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3561652","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3561652","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3561652","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028216967","display_name":"Aristeidis Mastoras","orcid":"https://orcid.org/0000-0002-5235-8499"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Aristeidis Mastoras","raw_affiliation_strings":["Computing Systems Laboratory, Zurich Research Center, Huawei Technologies Switzerland AG, Z\u00fcrich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-5235-8499","affiliations":[{"raw_affiliation_string":"Computing Systems Laboratory, Zurich Research Center, Huawei Technologies Switzerland AG, Z\u00fcrich, Switzerland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030953545","display_name":"Sotiris Anagnostidis","orcid":"https://orcid.org/0000-0001-8012-3331"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Sotiris Anagnostidis","raw_affiliation_strings":["Department of Computer Science, ETH Zurich, Z\u00fcrich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0001-8012-3331","affiliations":[{"raw_affiliation_string":"Department of Computer Science, ETH Zurich, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012014394","display_name":"Albert-Jan N. Yzelman","orcid":"https://orcid.org/0000-0001-8842-3689"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Albert-Jan N. Yzelman","raw_affiliation_strings":["Computing Systems Laboratory, Zurich Research Center, Huawei Technologies Switzerland AG, Z\u00fcrich, Switzerland"],"raw_orcid":"https://orcid.org/0000-0001-8842-3689","affiliations":[{"raw_affiliation_string":"Computing Systems Laboratory, Zurich Research Center, Huawei Technologies Switzerland AG, Z\u00fcrich, Switzerland","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5028216967"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.632,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.82493274,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"20","issue":"1","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9264786243438721},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8949580788612366},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.7664529085159302},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7509851455688477},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5521072149276733},{"id":"https://openalex.org/keywords/locality-of-reference","display_name":"Locality of reference","score":0.5503796339035034},{"id":"https://openalex.org/keywords/blocking","display_name":"Blocking (statistics)","score":0.5144920349121094}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9264786243438721},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8949580788612366},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.7664529085159302},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7509851455688477},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5521072149276733},{"id":"https://openalex.org/C27602214","wikidata":"https://www.wikidata.org/wiki/Q1868547","display_name":"Locality of reference","level":3,"score":0.5503796339035034},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.5144920349121094},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3561652","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3561652","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3561652","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3561652","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3561652","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3561652","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4294734199.pdf","grobid_xml":"https://content.openalex.org/works/W4294734199.grobid-xml"},"referenced_works_count":20,"referenced_works":["https://openalex.org/W1533528239","https://openalex.org/W1590602635","https://openalex.org/W1607380961","https://openalex.org/W2035080386","https://openalex.org/W2049890071","https://openalex.org/W2050129046","https://openalex.org/W2271295020","https://openalex.org/W2755088640","https://openalex.org/W2762661956","https://openalex.org/W2914097545","https://openalex.org/W2937604920","https://openalex.org/W2964357930","https://openalex.org/W2973134322","https://openalex.org/W2987548385","https://openalex.org/W2990689488","https://openalex.org/W2995872593","https://openalex.org/W3009867679","https://openalex.org/W3100839241","https://openalex.org/W4289827899","https://openalex.org/W4294761111"],"related_works":["https://openalex.org/W1555349535","https://openalex.org/W2583128298","https://openalex.org/W2053359564","https://openalex.org/W2161159383","https://openalex.org/W1495260638","https://openalex.org/W1511204342","https://openalex.org/W2369125128","https://openalex.org/W2369223577","https://openalex.org/W2010020348","https://openalex.org/W4238138329"],"abstract_inverted_index":{"GraphBLASis":[0],"a":[1,50,115,143,192],"recent":[2],"standard":[3],"that":[4,55,66,77,174,203],"allows":[5],"the":[6,12,97,100,122,154,163,178,189,217,227,230],"expression":[7],"of":[8,14,86,90,99,124,130,145,229],"graph":[9],"algorithms":[10],"in":[11,59,81,93,213],"language":[13],"linear":[15,200],"algebra":[16,201],"and":[17,22,29,53,70,96,185,207,216],"enables":[18,63],"automatic":[19,168],"code":[20],"parallelization":[21],"optimization.":[23],"GraphBLAS":[24],"operations":[25,76,91],"are":[26,108],"memory":[27],"bound":[28],"may":[30,78],"benefit":[31],"from":[32],"data":[33,68,72,80],"locality":[34],"optimizations":[35,65,209],"enabled":[36],"by":[37,133,176],"nonblocking":[38,41,57,84,101,125,155,219],"execution.":[39,165],"However,":[40],"execution":[42,58,85,102,126,141,156,206,220],"remains":[43],"under-evaluated.":[44],"In":[45],"this":[46,214],"article,":[47],"we":[48],"present":[49],"novel":[51],"design":[52],"implementation":[54],"investigates":[56],"GraphBLAS.":[60],"Lazy":[61],"evaluation":[62,120,190],"runtime":[64],"improve":[67],"locality,":[69],"dynamic":[71,94],"dependence":[73],"analysis":[74],"identifies":[75],"reuse":[79],"cache.":[82],"The":[83,119,149,166],"an":[87],"arbitrary":[88],"number":[89],"results":[92],"parallelism,":[95],"performance":[98,169],"depends":[103],"on":[104,114],"two":[105],"parameters,":[106],"which":[107],"automatically":[109],"determined,":[110],"at":[111],"run-time,":[112],"based":[113],"proposed":[116,150],"analytic":[117,151],"model.":[118],"confirms":[121],"importance":[123],"for":[127,182,198],"various":[128],"matrices":[129],"three":[131],"algorithms,":[132],"showing":[134],"up":[135,158,222],"to":[136,159,173,210,223],"4.11\u00d7":[137],"speedup":[138,161,225],"over":[139,162,226],"blocking":[140,164],"as":[142],"result":[144],"better":[146],"cache":[147],"utilization.":[148],"model":[152],"makes":[153],"reach":[157],"5.13\u00d7":[160],"fully":[167],"is":[170],"very":[171],"close":[172],"obtained":[175],"using":[177],"best":[179],"manual":[180],"configuration":[181],"both":[183],"small":[184],"large":[186],"matrices.":[187],"Finally,":[188],"includes":[191],"comparison":[193],"with":[194],"other":[195],"state-of-the-art":[196],"frameworks":[197],"numerical":[199],"programming":[202],"employ":[204],"parallel":[205],"similar":[208],"those":[211],"discussed":[212],"work,":[215],"presented":[218],"reaches":[221],"16.1\u00d7":[224],"state":[228],"art.":[231]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2023,"cited_by_count":2}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
