{"id":"https://openalex.org/W2034669281","doi":"https://doi.org/10.1145/2464996.2467282","title":"Inspector/executor load balancing algorithms for block-sparse tensor contractions","display_name":"Inspector/executor load balancing algorithms for block-sparse tensor contractions","publication_year":2013,"publication_date":"2013-05-28","ids":{"openalex":"https://openalex.org/W2034669281","doi":"https://doi.org/10.1145/2464996.2467282","mag":"2034669281"},"language":"en","primary_location":{"id":"doi:10.1145/2464996.2467282","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2464996.2467282","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th international ACM conference on International conference on supercomputing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103263285","display_name":"David Ozog","orcid":"https://orcid.org/0000-0001-6158-145X"},"institutions":[{"id":"https://openalex.org/I181233156","display_name":"University of Oregon","ror":"https://ror.org/0293rh119","country_code":"US","type":"education","lineage":["https://openalex.org/I181233156"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"David Ozog","raw_affiliation_strings":["University of Oregon, Eugene, Oregon, USA","University of Oregon , Eugene , Oregon , USA"],"affiliations":[{"raw_affiliation_string":"University of Oregon, Eugene, Oregon, USA","institution_ids":["https://openalex.org/I181233156"]},{"raw_affiliation_string":"University of Oregon , Eugene , Oregon , USA","institution_ids":["https://openalex.org/I181233156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023240094","display_name":"Sameer Shende","orcid":"https://orcid.org/0000-0002-2592-669X"},"institutions":[{"id":"https://openalex.org/I181233156","display_name":"University of Oregon","ror":"https://ror.org/0293rh119","country_code":"US","type":"education","lineage":["https://openalex.org/I181233156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sameer Shende","raw_affiliation_strings":["University of Oregon, Eugene, Oregon, USA","University of Oregon , Eugene , Oregon , USA"],"affiliations":[{"raw_affiliation_string":"University of Oregon, Eugene, Oregon, USA","institution_ids":["https://openalex.org/I181233156"]},{"raw_affiliation_string":"University of Oregon , Eugene , Oregon , USA","institution_ids":["https://openalex.org/I181233156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029524538","display_name":"Allen D. Malony","orcid":"https://orcid.org/0000-0002-9598-7201"},"institutions":[{"id":"https://openalex.org/I181233156","display_name":"University of Oregon","ror":"https://ror.org/0293rh119","country_code":"US","type":"education","lineage":["https://openalex.org/I181233156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Allen Malony","raw_affiliation_strings":["University of Oregon, Eugene, Oregon, USA","University of Oregon , Eugene , Oregon , USA"],"affiliations":[{"raw_affiliation_string":"University of Oregon, Eugene, Oregon, USA","institution_ids":["https://openalex.org/I181233156"]},{"raw_affiliation_string":"University of Oregon , Eugene , Oregon , USA","institution_ids":["https://openalex.org/I181233156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081388506","display_name":"Jeff R. Hammond","orcid":"https://orcid.org/0000-0003-3181-8190"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jeff R. Hammond","raw_affiliation_strings":["Argonne National Laboratory, Lemont, Illinois, USA","Argonne National Laboratory, Lemont, Illinois, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, Illinois, USA","institution_ids":["https://openalex.org/I1282105669"]},{"raw_affiliation_string":"Argonne National Laboratory, Lemont, Illinois, USA#TAB#","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078425310","display_name":"James Dinan","orcid":"https://orcid.org/0000-0002-4840-7737"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"James Dinan","raw_affiliation_strings":["Argonne National Laboratory, Lemont, Illinois, USA","Argonne National Laboratory, Lemont, Illinois, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, Illinois, USA","institution_ids":["https://openalex.org/I1282105669"]},{"raw_affiliation_string":"Argonne National Laboratory, Lemont, Illinois, USA#TAB#","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050531633","display_name":"Pavan Balaji","orcid":null},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pavan Balaji","raw_affiliation_strings":["Argonne National Laboratory, Lemont, Illinois, USA","Argonne National Laboratory, Lemont, Illinois, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, Illinois, USA","institution_ids":["https://openalex.org/I1282105669"]},{"raw_affiliation_string":"Argonne National Laboratory, Lemont, Illinois, USA#TAB#","institution_ids":["https://openalex.org/I1282105669"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5103263285"],"corresponding_institution_ids":["https://openalex.org/I181233156"],"apc_list":null,"apc_paid":null,"fwci":3.1715,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.91637241,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"483","last_page":"484"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11809","display_name":"Advanced NMR Techniques and Applications","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/executor","display_name":"Executor","score":0.8507993221282959},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7249515056610107},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5511016845703125},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5064598321914673},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.4683961868286133},{"id":"https://openalex.org/keywords/load-balancing","display_name":"Load balancing (electrical power)","score":0.4234396517276764},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3372551202774048},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14411216974258423},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.07817602157592773}],"concepts":[{"id":"https://openalex.org/C180591056","wikidata":"https://www.wikidata.org/wiki/Q654437","display_name":"Executor","level":2,"score":0.8507993221282959},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7249515056610107},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5511016845703125},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5064598321914673},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.4683961868286133},{"id":"https://openalex.org/C138959212","wikidata":"https://www.wikidata.org/wiki/Q1806783","display_name":"Load balancing (electrical power)","level":3,"score":0.4234396517276764},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3372551202774048},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14411216974258423},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.07817602157592773},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2464996.2467282","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2464996.2467282","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th international ACM conference on International conference on supercomputing","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.643.1266","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.643.1266","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.mcs.anl.gov/~balaji/pubs/2013/icpp/icpp13.tce-lb.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W99237326","https://openalex.org/W1483744369","https://openalex.org/W1573434297","https://openalex.org/W1584675441","https://openalex.org/W1854155214","https://openalex.org/W1897240848","https://openalex.org/W1968371739","https://openalex.org/W1978455437","https://openalex.org/W1980659426","https://openalex.org/W1984048334","https://openalex.org/W1987734677","https://openalex.org/W1999880473","https://openalex.org/W2001770854","https://openalex.org/W2012458244","https://openalex.org/W2012967522","https://openalex.org/W2017245598","https://openalex.org/W2017583835","https://openalex.org/W2022272738","https://openalex.org/W2022591290","https://openalex.org/W2026858719","https://openalex.org/W2038451118","https://openalex.org/W2052525902","https://openalex.org/W2054658678","https://openalex.org/W2056999868","https://openalex.org/W2062855563","https://openalex.org/W2069326762","https://openalex.org/W2087070363","https://openalex.org/W2092930273","https://openalex.org/W2093135480","https://openalex.org/W2098614082","https://openalex.org/W2098893915","https://openalex.org/W2104680817","https://openalex.org/W2109931506","https://openalex.org/W2109982223","https://openalex.org/W2110256578","https://openalex.org/W2110733790","https://openalex.org/W2118047751","https://openalex.org/W2120432957","https://openalex.org/W2121253712","https://openalex.org/W2127226421","https://openalex.org/W2135653967","https://openalex.org/W2136434791","https://openalex.org/W2146381930","https://openalex.org/W2149970695","https://openalex.org/W2159725480","https://openalex.org/W2312000176","https://openalex.org/W2561675875","https://openalex.org/W4210599536","https://openalex.org/W4233475787","https://openalex.org/W6628875336","https://openalex.org/W6704052874"],"related_works":["https://openalex.org/W2373444402","https://openalex.org/W1533011731","https://openalex.org/W1531488649","https://openalex.org/W2156176624","https://openalex.org/W1513409726","https://openalex.org/W1520923081","https://openalex.org/W1516525278","https://openalex.org/W2381685168","https://openalex.org/W2128313348","https://openalex.org/W1906009434"],"abstract_inverted_index":{"Developing":[0],"effective":[1],"yet":[2],"scalable":[3],"load-balancing":[4,150],"methods":[5,184],"for":[6,37,47],"irregular":[7],"computations":[8],"is":[9,93,188,197,208],"critical":[10],"to":[11,145,210],"the":[12,42,75,83,146,163,168,186],"successful":[13],"application":[14,187,213],"of":[15,20,31,50,64,77,95,100,165,170,182,222],"simulations":[16],"in":[17,134],"a":[18,29,60,191],"variety":[19],"disciplines":[21],"at":[22,70,204],"petascale":[23],"and":[24,33,176],"beyond.":[25],"This":[26],"paper":[27],"explores":[28],"set":[30],"static":[32,78,91],"dynamic":[34,98,121,149],"scheduling":[35,122,164],"algorithms":[36],"block-sparse":[38],"tensor":[39],"contractions":[40],"within":[41,123],"NWChem":[43,135],"computational":[44],"chemistry":[45,141],"code":[46],"different":[48],"degrees":[49],"sparsity":[51],"(and":[52],"therefore":[53],"load":[54,215],"imbalance).":[55],"In":[56,158],"this":[57],"particular":[58],"application,":[59],"relatively":[61],"large":[62,192],"amount":[63],"task":[65,85,101],"information":[66],"can":[67],"be":[68],"obtained":[69],"minimal":[71],"cost,":[72],"which":[73,128],"enables":[74],"use":[76],"partitioning":[79,92],"techniques":[80],"that":[81,119],"take":[82],"entire":[84],"list":[86],"as":[87,104,152,154,200,202],"input.":[88],"However,":[89],"fully":[90],"incapable":[94],"dealing":[96],"with":[97],"variation":[99],"costs,":[102],"such":[103],"from":[105,167],"transient":[106],"network":[107],"contention":[108],"or":[109,136,220],"operating":[110],"system":[111],"noise,":[112],"so":[113],"we":[114,161],"also":[115],"consider":[116],"hybrid":[117],"schemes":[118],"utilize":[120],"subgroups.":[124],"These":[125],"two":[126],"schemes,":[127],"have":[129],"not":[130],"been":[131],"previously":[132],"implemented":[133],"its":[137],"proxies":[138],"(i.e.":[139],"quantum":[140],"mini-apps)":[142],"are":[143,226],"compared":[144],"original":[147],"centralized":[148,156],"algorithm":[151],"well":[153],"improved":[155],"scheme.":[157],"all":[159],"cases,":[160],"separate":[162],"tasks":[166,171],"execution":[169,195,224],"into":[172],"an":[173,177],"inspector":[174],"phase":[175],"executor":[178],"phase.":[179],"The":[180,206],"impact":[181],"these":[183],"upon":[185],"substantial":[189],"on":[190],"InfiniBand":[193],"cluster:":[194],"time":[196],"reduced":[198],"by":[199],"much":[201],"50%":[203],"scale.":[205],"technique":[207],"applicable":[209],"any":[211],"scientific":[212],"requiring":[214],"balance":[216],"where":[217],"performance":[218],"models":[219],"estimations":[221],"kernel":[223],"times":[225],"available.":[227]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
