{"id":"https://openalex.org/W2320043833","doi":"https://doi.org/10.1145/2858652","title":"Leveraging Hardware Message Passing for Efficient Thread Synchronization","display_name":"Leveraging Hardware Message Passing for Efficient Thread Synchronization","publication_year":2016,"publication_date":"2016-01-29","ids":{"openalex":"https://openalex.org/W2320043833","doi":"https://doi.org/10.1145/2858652","mag":"2320043833"},"language":"en","primary_location":{"id":"doi:10.1145/2858652","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2858652","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046020902","display_name":"Darko Petrovi\u0107","orcid":null},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Darko Petrovi\u0107","raw_affiliation_strings":["Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland"],"affiliations":[{"raw_affiliation_string":"Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064121950","display_name":"Thomas Ropars","orcid":null},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Thomas Ropars","raw_affiliation_strings":["Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland"],"affiliations":[{"raw_affiliation_string":"Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111458171","display_name":"Andr\u00e9 Schiper","orcid":null},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Andr\u00e9 Schiper","raw_affiliation_strings":["Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland"],"affiliations":[{"raw_affiliation_string":"Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland","institution_ids":["https://openalex.org/I5124864"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5046020902"],"corresponding_institution_ids":["https://openalex.org/I5124864"],"apc_list":null,"apc_paid":null,"fwci":1.1581,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.80248375,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"2","issue":"4","first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.889638364315033},{"id":"https://openalex.org/keywords/cache-coherence","display_name":"Cache coherence","score":0.61427241563797},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6142658591270447},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.6016308069229126},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.5342758297920227},{"id":"https://openalex.org/keywords/shared-memory","display_name":"Shared memory","score":0.5288801193237305},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5064448118209839},{"id":"https://openalex.org/keywords/queue","display_name":"Queue","score":0.43012186884880066},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.36108332872390747},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.33859506249427795},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.3141138553619385},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.25735074281692505},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.14917150139808655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.889638364315033},{"id":"https://openalex.org/C141917322","wikidata":"https://www.wikidata.org/wiki/Q1025017","display_name":"Cache coherence","level":5,"score":0.61427241563797},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6142658591270447},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.6016308069229126},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.5342758297920227},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.5288801193237305},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5064448118209839},{"id":"https://openalex.org/C160403385","wikidata":"https://www.wikidata.org/wiki/Q220543","display_name":"Queue","level":2,"score":0.43012186884880066},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.36108332872390747},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33859506249427795},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.3141138553619385},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.25735074281692505},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.14917150139808655},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2858652","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2858652","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.800000011920929,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1501380952","https://openalex.org/W1525350307","https://openalex.org/W1974420955","https://openalex.org/W1979885075","https://openalex.org/W1981393723","https://openalex.org/W1983572666","https://openalex.org/W1992679913","https://openalex.org/W2001738739","https://openalex.org/W2014345013","https://openalex.org/W2031844067","https://openalex.org/W2047400318","https://openalex.org/W2049013629","https://openalex.org/W2054739713","https://openalex.org/W2073407658","https://openalex.org/W2100817684","https://openalex.org/W2101939036","https://openalex.org/W2111470409","https://openalex.org/W2114688360","https://openalex.org/W2119887431","https://openalex.org/W2132220514","https://openalex.org/W2134058640","https://openalex.org/W2138404963","https://openalex.org/W2151460056","https://openalex.org/W2152455393","https://openalex.org/W2166263713","https://openalex.org/W2168075869","https://openalex.org/W2198138176","https://openalex.org/W2225140656","https://openalex.org/W2995394804","https://openalex.org/W4245607618"],"related_works":["https://openalex.org/W2118508246","https://openalex.org/W1979099492","https://openalex.org/W97688277","https://openalex.org/W4255008187","https://openalex.org/W2407815036","https://openalex.org/W4250205214","https://openalex.org/W2143087414","https://openalex.org/W1797968800","https://openalex.org/W2549803267","https://openalex.org/W3216777841"],"abstract_inverted_index":{"As":[0],"the":[1,34,37,56,115,129,136,144,161,184,194,208],"level":[2],"of":[3,36,59,106,117,135],"parallelism":[4],"in":[5,16],"manycore":[6],"processors":[7],"keeps":[8],"increasing,":[9],"providing":[10],"efficient":[11,216],"mechanisms":[12],"for":[13,48,66],"thread":[14],"synchronization":[15,28,53,119,210],"concurrent":[17],"programs":[18],"is":[19,30,131,146],"becoming":[20],"a":[21,77,104,132,147],"major":[22],"concern.":[23],"On":[24],"cache-coherent":[25],"shared-memory":[26],"processors,":[27],"efficiency":[29],"ultimately":[31],"limited":[32],"by":[33,94],"performance":[35,191],"underlying":[38],"cache":[39,179],"coherence":[40,180],"protocol.":[41],"This":[42],"article":[43],"studies":[44],"how":[45],"hardware":[46,110,140],"support":[47],"message":[49,111,141],"passing":[50],"can":[51,168,188],"improve":[52],"performance.":[54],"Considering":[55],"ubiquitous":[57],"problem":[58],"mutual":[60],"exclusion,":[61],"we":[62,123],"devise":[63],"novel":[64,148],"algorithms":[65],"(i)":[67],"classic":[68,98,164],"locking,":[69,99],"where":[70,90],"application":[71],"threads":[72],"obtain":[73],"exclusive":[74],"access":[75],"to":[76,81,139,178,196],"shared":[78,107],"resource":[79],"prior":[80],"executing":[82],"their":[83,214],"critical":[84,185],"sections":[85],"(CSes),":[86],"and":[87,109,126,203],"(ii)":[88],"delegation,":[89,122],"CSes":[91,171],"are":[92,181],"executed":[93],"special":[95],"threads.":[96],"For":[97,121],"our":[100,201],"HybLock":[101,159],"algorithm":[102],"uses":[103],"mix":[105],"memory":[108],"passing,":[112,142],"which":[113],"introduces":[114],"idea":[116],"hybrid":[118,149],"algorithms.":[120],"propose":[124],"mp-server":[125,167],"HybComb":[127,187],":":[128],"former":[130],"straightforward":[133],"adaptation":[134],"server":[137,198],"approach":[138],"whereas":[143],"latter":[145],"combining":[150],"algorithm.":[151],"Evaluation":[152],"on":[153,207],"Tilera's":[154],"TILE-Gx":[155],"processor":[156],"shows":[157],"that":[158],"outperforms":[160],"best":[162],"known":[163],"locks.":[165],"Furthermore,":[166],"execute":[169],"contended":[170],"with":[172],"unprecedented":[173],"throughput,":[174],"as":[175],"stalls":[176],"related":[177],"removed":[182],"from":[183],"path.":[186],"achieve":[189],"comparable":[190],"while":[192],"avoiding":[193],"need":[195],"dedicate":[197],"cores.":[199],"Consequently,":[200],"queue":[202],"stack":[204],"implementations,":[205],"based":[206],"new":[209],"algorithms,":[211],"largely":[212],"outperform":[213],"most":[215],"shared-memory-only":[217],"counterparts.":[218]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
