{"id":"https://openalex.org/W2120753531","doi":"https://doi.org/10.1109/ipdps.2008.4536358","title":"Facilitating efficient synchronization of asymmetric threads on hyper-threaded processors","display_name":"Facilitating efficient synchronization of asymmetric threads on hyper-threaded processors","publication_year":2008,"publication_date":"2008-04-01","ids":{"openalex":"https://openalex.org/W2120753531","doi":"https://doi.org/10.1109/ipdps.2008.4536358","mag":"2120753531"},"language":"en","primary_location":{"id":"doi:10.1109/ipdps.2008.4536358","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2008.4536358","pdf_url":null,"source":{"id":"https://openalex.org/S4210174069","display_name":"Proceedings - IEEE International Parallel and Distributed Processing Symposium","issn_l":"1530-2075","issn":["1530-2075"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE International Symposium on Parallel and Distributed Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://doi.org/10.1109/IPDPS.2008.4536358","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026690826","display_name":"Nikos Anastopoulos","orcid":null},"institutions":[{"id":"https://openalex.org/I174458059","display_name":"National Technical University of Athens","ror":"https://ror.org/03cx6bg69","country_code":"GR","type":"education","lineage":["https://openalex.org/I174458059"]},{"id":"https://openalex.org/I200777214","display_name":"National and Kapodistrian University of Athens","ror":"https://ror.org/04gnjpq42","country_code":"GR","type":"education","lineage":["https://openalex.org/I200777214"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Nikos Anastopoulos","raw_affiliation_strings":["School of Electrical and Computer Engineering, Computing Systems Laboratory, National and Technical University of Athens, Greece","Sch. of Electr. & Comput. Eng. Comput. Syst. Lab., Nat. Tech. Univ. of Athens, Athens"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Computing Systems Laboratory, National and Technical University of Athens, Greece","institution_ids":["https://openalex.org/I174458059"]},{"raw_affiliation_string":"Sch. of Electr. & Comput. Eng. Comput. Syst. Lab., Nat. Tech. Univ. of Athens, Athens","institution_ids":["https://openalex.org/I200777214"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023526161","display_name":"Nectarios Koziris","orcid":"https://orcid.org/0000-0002-4890-8427"},"institutions":[{"id":"https://openalex.org/I200777214","display_name":"National and Kapodistrian University of Athens","ror":"https://ror.org/04gnjpq42","country_code":"GR","type":"education","lineage":["https://openalex.org/I200777214"]},{"id":"https://openalex.org/I174458059","display_name":"National Technical University of Athens","ror":"https://ror.org/03cx6bg69","country_code":"GR","type":"education","lineage":["https://openalex.org/I174458059"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Nectarios Koziris","raw_affiliation_strings":["School of Electrical and Computer Engineering, Computing Systems Laboratory, National and Technical University of Athens, Greece","Sch. of Electr. & Comput. Eng. Comput. Syst. Lab., Nat. Tech. Univ. of Athens, Athens"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Computing Systems Laboratory, National and Technical University of Athens, Greece","institution_ids":["https://openalex.org/I174458059"]},{"raw_affiliation_string":"Sch. of Electr. & Comput. Eng. Comput. Syst. Lab., Nat. Tech. Univ. of Athens, Athens","institution_ids":["https://openalex.org/I200777214"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5026690826"],"corresponding_institution_ids":["https://openalex.org/I174458059","https://openalex.org/I200777214"],"apc_list":null,"apc_paid":null,"fwci":2.1261,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.88589939,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/posix-threads","display_name":"POSIX Threads","score":0.967119574546814},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8703843355178833},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.7764407396316528},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6749570369720459},{"id":"https://openalex.org/keywords/synchronizing","display_name":"Synchronizing","score":0.6321608424186707},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.5812650322914124},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.5804396271705627},{"id":"https://openalex.org/keywords/semaphore","display_name":"Semaphore","score":0.5038809180259705},{"id":"https://openalex.org/keywords/multithreading","display_name":"Multithreading","score":0.47371906042099},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.42236363887786865},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4218409061431885},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.4143780469894409},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.413105309009552},{"id":"https://openalex.org/keywords/speculative-multithreading","display_name":"Speculative multithreading","score":0.4110383987426758},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.31380242109298706},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.146424800157547}],"concepts":[{"id":"https://openalex.org/C41138395","wikidata":"https://www.wikidata.org/wiki/Q928112","display_name":"POSIX Threads","level":3,"score":0.967119574546814},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8703843355178833},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.7764407396316528},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6749570369720459},{"id":"https://openalex.org/C162932704","wikidata":"https://www.wikidata.org/wiki/Q1058791","display_name":"Synchronizing","level":3,"score":0.6321608424186707},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.5812650322914124},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.5804396271705627},{"id":"https://openalex.org/C95203288","wikidata":"https://www.wikidata.org/wiki/Q221682","display_name":"Semaphore","level":2,"score":0.5038809180259705},{"id":"https://openalex.org/C201410400","wikidata":"https://www.wikidata.org/wiki/Q1064412","display_name":"Multithreading","level":3,"score":0.47371906042099},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.42236363887786865},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4218409061431885},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.4143780469894409},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.413105309009552},{"id":"https://openalex.org/C15296174","wikidata":"https://www.wikidata.org/wiki/Q7575343","display_name":"Speculative multithreading","level":4,"score":0.4110383987426758},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.31380242109298706},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.146424800157547},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ipdps.2008.4536358","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2008.4536358","pdf_url":null,"source":{"id":"https://openalex.org/S4210174069","display_name":"Proceedings - IEEE International Parallel and Distributed Processing Symposium","issn_l":"1530-2075","issn":["1530-2075"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE International Symposium on Parallel and Distributed Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:dspace.lib.ntua.gr:123456789/32247","is_oa":true,"landing_page_url":"http://doi.org/10.1109/IPDPS.2008.4536358","pdf_url":null,"source":{"id":"https://openalex.org/S4377196837","display_name":"DSpace - NTUA (National Technical University of Athens)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I174458059","host_organization_name":"National Technical University of Athens","host_organization_lineage":["https://openalex.org/I174458059"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IPDPS Miami 2008 - Proceedings of the 22nd IEEE International Parallel and Distributed Processing Symposium, Program and CD-ROM","raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:dspace.lib.ntua.gr:123456789/32247","is_oa":true,"landing_page_url":"http://doi.org/10.1109/IPDPS.2008.4536358","pdf_url":null,"source":{"id":"https://openalex.org/S4377196837","display_name":"DSpace - NTUA (National Technical University of Athens)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I174458059","host_organization_name":"National Technical University of Athens","host_organization_lineage":["https://openalex.org/I174458059"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IPDPS Miami 2008 - Proceedings of the 22nd IEEE International Parallel and Distributed Processing Symposium, Program and CD-ROM","raw_type":"info:eu-repo/semantics/conferenceObject"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth","score":0.5699999928474426}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1555915743","https://openalex.org/W1982011377","https://openalex.org/W2116020886","https://openalex.org/W2120230074","https://openalex.org/W2131498141","https://openalex.org/W2155010932","https://openalex.org/W2170582961","https://openalex.org/W2184804519","https://openalex.org/W2249344705","https://openalex.org/W2725179571","https://openalex.org/W3142147837","https://openalex.org/W4231131543","https://openalex.org/W4240436476","https://openalex.org/W6682926681","https://openalex.org/W6792903772"],"related_works":["https://openalex.org/W2365741265","https://openalex.org/W2098322082","https://openalex.org/W2914044836","https://openalex.org/W2369027488","https://openalex.org/W2381891087","https://openalex.org/W2368907619","https://openalex.org/W4294310504","https://openalex.org/W1999755551","https://openalex.org/W2765149243","https://openalex.org/W4283366496"],"abstract_inverted_index":{"So":[0],"far,":[1],"the":[2,50,97,114,118,153,165],"privileged":[3],"instructions":[4,29,55],"MONITOR":[5],"and":[6,65,87,127,129,159,189,212,239],"MWAIT":[7],"introduced":[8],"with":[9,90],"Intel":[10],"Prescott":[11],"core,":[12],"have":[13],"been":[14],"used":[15,136],"mostly":[16],"for":[17,34,56,170,196],"inter-thread":[18,172],"synchronization":[19,38,148],"in":[20,37,102,207,214],"operating":[21],"systems":[22],"code.":[23],"In":[24,45,174],"a":[25,31,43,74,103,139,161,193,208],"hyper-threaded":[26,63],"processor,":[27],"these":[28,54,100],"offer":[30],"\"performance-optimized\"":[32],"way":[33],"threads":[35,59,200],"involved":[36],"events":[39],"to":[40,83,146,187,192,232,237,241,244],"wait":[41,86],"on":[42,62,184,220],"condition.":[44],"this":[46,224],"work,":[47],"we":[48,72,95,108,130,142,151,163,203],"explore":[49],"potential":[51],"of":[52,99,113,167,176,199],"using":[53,160],"synchronizing":[57],"application":[58],"that":[60,116],"execute":[61],"processors,":[64],"are":[66],"characterized":[67],"by":[68],"workload":[69],"asymmetry.":[70,201],"Initially,":[71],"propose":[73],"framework":[75],"through":[76],"which":[77],"one":[78],"can":[79],"use":[80,143],"MON-":[81],"ITOR/MWAIT":[82],"build":[84,147],"condition":[85],"notification":[88],"primitives,":[89],"minimal":[91],"kernel":[92],"involvement.":[93],"Then,":[94],"evaluate":[96,164],"efficiency":[98,166],"primitives":[101,115,145],"bottom-up":[104],"manner:":[105],"at":[106],"first,":[107],"quantify":[109],"certain":[110],"performance":[111,155,183,235],"aspects":[112],"reflect":[117],"execution":[119,226],"model":[120],"under":[121],"consideration,":[122],"such":[123],"as":[124,157],"resource":[125],"consumption":[126],"responsiveness,":[128],"compare":[131],"them":[132],"against":[133],"other":[134],"commonly":[135],"implementations.":[137],"As":[138],"further":[140],"step,":[141],"our":[144,168,178,205,228],"barriers.":[149,246],"Again,":[150],"examine":[152],"same":[154],"issues":[156],"before,":[158],"pseudo-benchmark":[162],"implementation":[169,229],"fine-grained":[171],"synchronization.":[173],"terms":[175],"throughput,":[177],"barriers":[179,206],"yielded":[180],"12%":[181],"better":[182,234],"average":[185],"compared":[186,191,236,243],"Pthreads,":[188,238],"26%":[190],"spin-loops-based":[194,245],"implementation,":[195],"varying":[197],"levels":[198],"Finally,":[202],"test":[204],"real-":[209],"world":[210],"scenario,":[211],"specifically,":[213],"applying":[215],"thread-level":[216],"Speculative":[217],"Pre":[218],"computation":[219],"four":[221],"applications.":[222],"For":[223],"multithreaded":[225],"scheme,":[227],"provided":[230],"up":[231,240],"7%":[233],"40%":[242]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":6},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
