{"id":"https://openalex.org/W3007668436","doi":"https://doi.org/10.1109/tpds.2020.2976057","title":"Analyzing the Performance Trade-Off in Implementing User-Level Threads","display_name":"Analyzing the Performance Trade-Off in Implementing User-Level Threads","publication_year":2020,"publication_date":"2020-02-28","ids":{"openalex":"https://openalex.org/W3007668436","doi":"https://doi.org/10.1109/tpds.2020.2976057","mag":"3007668436"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2020.2976057","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.2976057","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.osti.gov/biblio/1660747","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076576150","display_name":"Shintaro Iwasaki","orcid":"https://orcid.org/0000-0002-4748-8459"},"institutions":[{"id":"https://openalex.org/I14396692","display_name":"Tokyo University of Information Sciences","ror":"https://ror.org/044bdx604","country_code":"JP","type":"education","lineage":["https://openalex.org/I14396692"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Shintaro Iwasaki","raw_affiliation_strings":["Department of Information and Communication Engineering, University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Information and Communication Engineering, University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I14396692","https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103934446","display_name":"Abdelhalim Amer","orcid":"https://orcid.org/0000-0001-5856-0172"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abdelhalim Amer","raw_affiliation_strings":["Mathematics and Computer Science Division, Argonne National Laboratory, Lemont, USA"],"affiliations":[{"raw_affiliation_string":"Mathematics and Computer Science Division, Argonne National Laboratory, Lemont, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009359355","display_name":"Kenjiro Taura","orcid":"https://orcid.org/0000-0001-5224-382X"},"institutions":[{"id":"https://openalex.org/I14396692","display_name":"Tokyo University of Information Sciences","ror":"https://ror.org/044bdx604","country_code":"JP","type":"education","lineage":["https://openalex.org/I14396692"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kenjiro Taura","raw_affiliation_strings":["Department of Information and Communication Engineering, University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Information and Communication Engineering, University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I14396692","https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050531633","display_name":"Pavan Balaji","orcid":null},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pavan Balaji","raw_affiliation_strings":["Mathematical and Computer Science, Argonne National Laboratory, Lemont, USA"],"affiliations":[{"raw_affiliation_string":"Mathematical and Computer Science, Argonne National Laboratory, Lemont, USA","institution_ids":["https://openalex.org/I1282105669"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5076576150"],"corresponding_institution_ids":["https://openalex.org/I14396692","https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":1.1786,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.75962216,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"31","issue":"8","first_page":"1859","last_page":"1877"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8583364486694336},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.4780876338481903},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4567289650440216},{"id":"https://openalex.org/keywords/processor-scheduling","display_name":"Processor scheduling","score":0.44216081500053406},{"id":"https://openalex.org/keywords/multithreading","display_name":"Multithreading","score":0.41502341628074646},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.33696720004081726},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3360848128795624},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.27419912815093994}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8583364486694336},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.4780876338481903},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4567289650440216},{"id":"https://openalex.org/C2984822820","wikidata":"https://www.wikidata.org/wiki/Q1123036","display_name":"Processor scheduling","level":3,"score":0.44216081500053406},{"id":"https://openalex.org/C201410400","wikidata":"https://www.wikidata.org/wiki/Q1064412","display_name":"Multithreading","level":3,"score":0.41502341628074646},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33696720004081726},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3360848128795624},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.27419912815093994},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpds.2020.2976057","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.2976057","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},{"id":"pmh:oai:osti.gov:1660747","is_oa":true,"landing_page_url":"https://www.osti.gov/biblio/1660747","pdf_url":null,"source":{"id":"https://openalex.org/S4306402487","display_name":"OSTI OAI (U.S. Department of Energy Office of Scientific and Technical Information)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I139351228","host_organization_name":"Office of Scientific and Technical Information","host_organization_lineage":["https://openalex.org/I139351228"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"pmh:oai:osti.gov:1660747","is_oa":true,"landing_page_url":"https://www.osti.gov/biblio/1660747","pdf_url":null,"source":{"id":"https://openalex.org/S4306402487","display_name":"OSTI OAI (U.S. Department of Energy Office of Scientific and Technical Information)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I139351228","host_organization_name":"Office of Scientific and Technical Information","host_organization_lineage":["https://openalex.org/I139351228"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7954425250","display_name":null,"funder_award_id":"DE-AC02-06CH11357","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"}],"funders":[{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320332369","display_name":"National Nuclear Security Administration","ror":"https://ror.org/03sk1we31"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W1521891776","https://openalex.org/W1535758606","https://openalex.org/W1536852470","https://openalex.org/W1583973024","https://openalex.org/W1861208929","https://openalex.org/W1965351873","https://openalex.org/W1967882079","https://openalex.org/W1968020161","https://openalex.org/W1976573773","https://openalex.org/W1984054440","https://openalex.org/W1994549753","https://openalex.org/W1999241319","https://openalex.org/W2016559894","https://openalex.org/W2032404535","https://openalex.org/W2037574360","https://openalex.org/W2038013988","https://openalex.org/W2046814629","https://openalex.org/W2062273873","https://openalex.org/W2069765416","https://openalex.org/W2072725684","https://openalex.org/W2079577430","https://openalex.org/W2084423328","https://openalex.org/W2091905905","https://openalex.org/W2093127332","https://openalex.org/W2096898433","https://openalex.org/W2099887980","https://openalex.org/W2101132897","https://openalex.org/W2104861744","https://openalex.org/W2108801243","https://openalex.org/W2131296084","https://openalex.org/W2133250609","https://openalex.org/W2139031153","https://openalex.org/W2142677441","https://openalex.org/W2146700739","https://openalex.org/W2160709036","https://openalex.org/W2173839706","https://openalex.org/W2174728072","https://openalex.org/W2182388272","https://openalex.org/W2469198586","https://openalex.org/W2535359146","https://openalex.org/W2581356531","https://openalex.org/W2765106570","https://openalex.org/W2799001871","https://openalex.org/W2889256647","https://openalex.org/W2902696731","https://openalex.org/W2913324528","https://openalex.org/W2978619376","https://openalex.org/W2985428643","https://openalex.org/W3005947729","https://openalex.org/W3021594640","https://openalex.org/W3147172531","https://openalex.org/W4235252000","https://openalex.org/W6631160967","https://openalex.org/W6679289121"],"related_works":["https://openalex.org/W1963782977","https://openalex.org/W1993191611","https://openalex.org/W4248655967","https://openalex.org/W2138520521","https://openalex.org/W2338363223","https://openalex.org/W2544870670","https://openalex.org/W3002912422","https://openalex.org/W1997399539","https://openalex.org/W4382866741","https://openalex.org/W4255428424"],"abstract_inverted_index":{"User-level":[0],"threads":[1,26],"have":[2],"been":[3],"widely":[4],"adopted":[5],"as":[6],"a":[7,28,64,99,103,113,136],"means":[8],"of":[9,17,23,80,84,98,112,116,142,153,165,183],"achieving":[10],"lightweight":[11],"concurrent":[12],"execution":[13,97],"without":[14,44],"the":[15,21,36,68,81,96,163,173,181],"costs":[16,22,70],"OS-level":[18],"threads.":[19,74],"Nevertheless,":[20],"managing":[24],"user-level":[25,73],"represent":[27],"performance":[29,177],"barrier":[30],"that":[31,78,91,157,161],"dictates":[32],"how":[33,121],"fine":[34],"grained":[35],"concurrency":[37],"exposed":[38],"by":[39],"an":[40,109],"application":[41],"can":[42],"be":[43],"incurring":[45],"significant":[46],"overheads;":[47],"this":[48],"in":[49,71],"turn":[50],"may":[51],"translate":[52],"into":[53,67],"insufficient":[54],"parallelism":[55],"to":[56,120],"exploit":[57],"highly":[58],"parallel":[59],"systems.":[60],"This":[61],"article":[62],"is":[63,156,185],"deep":[65],"dive":[66],"fundamental":[69],"implementing":[72],"We":[75,106],"first":[76],"identify":[77],"one":[79],"highest":[82],"sources":[83],"fork-join":[85],"overheads":[86],"stems":[87],"from":[88],"deviations,":[89],"events":[90],"incur":[92],"context":[93],"switching":[94],"during":[95],"thread":[100],"and":[101,129,139,167,178],"disrupt":[102],"run-to-completion":[104],"execution.":[105],"then":[107],"conduct":[108],"in-depth":[110],"investigation":[111],"wide":[114],"spectrum":[115],"methods":[117,144,160],"with":[118],"respect":[119],"they":[122],"handle":[123],"deviations":[124],"while":[125],"covering":[126],"both":[127],"parent-":[128],"child-first":[130],"scheduling":[131],"policies.":[132],"Our":[133],"methodology":[134],"involves":[135],"comprehensive":[137],"instruction-":[138],"cache-level":[140],"analysis":[141],"all":[143],"on":[145],"several":[146],"modern":[147],"CPU":[148],"architectures.":[149],"The":[150],"primary":[151],"finding":[152],"our":[154],"evaluation":[155],"dynamic":[158],"promotion":[159],"assume":[162],"absence":[164],"deviation":[166,184],"dynamically":[168],"provide":[169],"context-switching":[170],"support":[171],"offer":[172],"best":[174],"trade-off":[175],"between":[176],"capability":[179],"when":[180],"likelihood":[182],"low.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
