{"id":"https://openalex.org/W3202821777","doi":"https://doi.org/10.1145/3472456.3472522","title":"Optimizing Work Stealing Communication with Structured Atomic Operations","display_name":"Optimizing Work Stealing Communication with Structured Atomic Operations","publication_year":2021,"publication_date":"2021-08-09","ids":{"openalex":"https://openalex.org/W3202821777","doi":"https://doi.org/10.1145/3472456.3472522","mag":"3202821777"},"language":"en","primary_location":{"id":"doi:10.1145/3472456.3472522","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3472456.3472522","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3472456.3472522","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"50th International Conference on Parallel Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3472456.3472522","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009125571","display_name":"Hannah Cartier","orcid":null},"institutions":[{"id":"https://openalex.org/I117979880","display_name":"Rhodes College","ror":"https://ror.org/049xfwy04","country_code":"US","type":"education","lineage":["https://openalex.org/I117979880"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hannah Cartier","raw_affiliation_strings":["Rhodes College"],"affiliations":[{"raw_affiliation_string":"Rhodes College","institution_ids":["https://openalex.org/I117979880"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078425310","display_name":"James Dinan","orcid":"https://orcid.org/0000-0002-4840-7737"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"James Dinan","raw_affiliation_strings":["NVIDIA"],"affiliations":[{"raw_affiliation_string":"NVIDIA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024096606","display_name":"D. Brian Larkins","orcid":"https://orcid.org/0000-0002-2131-0847"},"institutions":[{"id":"https://openalex.org/I117979880","display_name":"Rhodes College","ror":"https://ror.org/049xfwy04","country_code":"US","type":"education","lineage":["https://openalex.org/I117979880"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"D. Brian Larkins","raw_affiliation_strings":["Rhodes College"],"affiliations":[{"raw_affiliation_string":"Rhodes College","institution_ids":["https://openalex.org/I117979880"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5009125571"],"corresponding_institution_ids":["https://openalex.org/I117979880"],"apc_list":null,"apc_paid":null,"fwci":0.2022,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.51591836,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8492444753646851},{"id":"https://openalex.org/keywords/queue","display_name":"Queue","score":0.6664255857467651},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.659040093421936},{"id":"https://openalex.org/keywords/load-balancing","display_name":"Load balancing (electrical power)","score":0.6198219060897827},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5722993612289429},{"id":"https://openalex.org/keywords/message-queue","display_name":"Message queue","score":0.5158118605613708},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.5022621154785156},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4933132231235504},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.49073541164398193},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.46513527631759644},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.3290429711341858},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.19815143942832947},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.1328190267086029},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.11326479911804199},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11147123575210571}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8492444753646851},{"id":"https://openalex.org/C160403385","wikidata":"https://www.wikidata.org/wiki/Q220543","display_name":"Queue","level":2,"score":0.6664255857467651},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.659040093421936},{"id":"https://openalex.org/C138959212","wikidata":"https://www.wikidata.org/wiki/Q1806783","display_name":"Load balancing (electrical power)","level":3,"score":0.6198219060897827},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5722993612289429},{"id":"https://openalex.org/C26324664","wikidata":"https://www.wikidata.org/wiki/Q1065525","display_name":"Message queue","level":2,"score":0.5158118605613708},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.5022621154785156},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4933132231235504},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.49073541164398193},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.46513527631759644},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3290429711341858},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.19815143942832947},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.1328190267086029},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.11326479911804199},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11147123575210571},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3472456.3472522","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3472456.3472522","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3472456.3472522","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"50th International Conference on Parallel Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3472456.3472522","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3472456.3472522","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3472456.3472522","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"50th International Conference on Parallel Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3338472867","display_name":null,"funder_award_id":"ACI-1053575","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5642555396","display_name":null,"funder_award_id":"ACI-10535","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5921281487","display_name":null,"funder_award_id":"number","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6778350887","display_name":null,"funder_award_id":"1053575","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7331974020","display_name":null,"funder_award_id":"ACI-1053575.","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7918953861","display_name":null,"funder_award_id":"2018758","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3202821777.pdf","grobid_xml":"https://content.openalex.org/works/W3202821777.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W1529391588","https://openalex.org/W1612065083","https://openalex.org/W2019028742","https://openalex.org/W2019380637","https://openalex.org/W2036551003","https://openalex.org/W2040466547","https://openalex.org/W2042088790","https://openalex.org/W2054583871","https://openalex.org/W2056333732","https://openalex.org/W2070587796","https://openalex.org/W2072725684","https://openalex.org/W2079031056","https://openalex.org/W2109065830","https://openalex.org/W2132745343","https://openalex.org/W2146381930","https://openalex.org/W2147685859","https://openalex.org/W2157124218","https://openalex.org/W2161989797","https://openalex.org/W2168339347","https://openalex.org/W2558246989","https://openalex.org/W2678866158","https://openalex.org/W2963102613","https://openalex.org/W3012343893","https://openalex.org/W4250588632"],"related_works":["https://openalex.org/W2392768766","https://openalex.org/W2058118494","https://openalex.org/W2095118173","https://openalex.org/W2382021449","https://openalex.org/W2104269053","https://openalex.org/W2106424170","https://openalex.org/W2501188010","https://openalex.org/W4299935056","https://openalex.org/W2768810474","https://openalex.org/W4206575749"],"abstract_inverted_index":{"Applications":[0],"that":[1,51,66,144],"rely":[2],"on":[3,13,195],"sparse":[4,196],"or":[5],"irregular":[6],"data":[7],"are":[8,118],"often":[9],"challenging":[10],"to":[11,29,38,76],"scale":[12],"modern":[14],"distributed-memory":[15],"systems.":[16],"As":[17],"a":[18,35,46,59,70,91,98,113,121,146],"result,":[19],"these":[20],"systems":[21,168],"typically":[22],"require":[23],"continuous":[24],"load":[25,166],"balancing":[26,167],"in":[27,67,120,133,180,190],"order":[28],"maintain":[30],"efficiency.":[31],"Work":[32],"stealing":[33,50,96],"is":[34,135],"common":[36],"technique":[37],"remedy":[39],"imbalance.":[40],"In":[41],"this":[42,158],"work":[43,49,89,95,104],"we":[44,82],"present":[45],"strategy":[47,159],"for":[48,58,69,127,163,170],"reduces":[52,182],"the":[53,78,125,138,155,178],"amount":[54,72],"of":[55,73,102,141,149,157],"communication":[56,123,134,181],"required":[57],"steal":[60,187],"operation":[61],"by":[62],"half.":[63],"We":[64,153],"show":[65,177],"exchange":[68],"small":[71],"additional":[74],"complexity":[75],"manage":[77],"local":[79],"queue":[80,151],"state":[81],"can":[83],"combine":[84],"both":[85,116],"discovering":[86,103],"and":[87,105,169,186],"claiming":[88,107],"into":[90],"single":[92],"step.":[93],"Conventionally,":[94],"uses":[97],"two":[99],"step":[100],"process":[101],"then":[106],"it.":[108],"Our":[109,175],"system,":[110],"SWS,":[111],"provides":[112],"mechanism":[114],"where":[115],"processes":[117],"performed":[119],"singular":[122],"without":[124],"need":[126],"multiple":[128],"synchronization":[129],"messages.":[130],"This":[131],"reduction":[132,179],"possible":[136],"with":[137],"novel":[139],"application":[140],"atomic":[142],"operations":[143],"manipulate":[145],"compact":[147],"representation":[148],"task":[150,183],"metadata.":[152],"demonstrate":[154],"effectiveness":[156],"using":[160],"known":[161],"benchmarks":[162],"testing":[164],"dynamic":[165],"performing":[171],"unbalanced":[172],"tree":[173],"searches.":[174],"results":[176],"acquisition":[184],"time":[185],"time,":[188],"which":[189],"turn":[191],"improves":[192],"overall":[193],"performance":[194],"computations.":[197]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
