{"id":"https://openalex.org/W2916475468","doi":"https://doi.org/10.1145/3303084.3309488","title":"Don't Forget About Synchronization!","display_name":"Don't Forget About Synchronization!","publication_year":2019,"publication_date":"2019-02-17","ids":{"openalex":"https://openalex.org/W2916475468","doi":"https://doi.org/10.1145/3303084.3309488","mag":"2916475468"},"language":"en","primary_location":{"id":"doi:10.1145/3303084.3309488","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3303084.3309488","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3303084.3309488","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 10th International Workshop on Programming Models and Applications for Multicores and Manycores","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3303084.3309488","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075224001","display_name":"Jacob Nelson","orcid":"https://orcid.org/0000-0003-0791-5281"},"institutions":[{"id":"https://openalex.org/I186143895","display_name":"Lehigh University","ror":"https://ror.org/012afjb06","country_code":"US","type":"education","lineage":["https://openalex.org/I186143895"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jacob Nelson","raw_affiliation_strings":["Computer Science and Engineering, Lehigh University, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Lehigh University, USA","institution_ids":["https://openalex.org/I186143895"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060347832","display_name":"Roberto Palmieri","orcid":"https://orcid.org/0000-0002-1530-4088"},"institutions":[{"id":"https://openalex.org/I186143895","display_name":"Lehigh University","ror":"https://ror.org/012afjb06","country_code":"US","type":"education","lineage":["https://openalex.org/I186143895"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Roberto Palmieri","raw_affiliation_strings":["Computer Science and Engineering, Lehigh University, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Lehigh University, USA","institution_ids":["https://openalex.org/I186143895"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5075224001"],"corresponding_institution_ids":["https://openalex.org/I186143895"],"apc_list":null,"apc_paid":null,"fwci":1.7223,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.83069862,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"11","last_page":"20"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8940328359603882},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.6982375979423523},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6307542324066162},{"id":"https://openalex.org/keywords/graphics-processing-unit","display_name":"Graphics processing unit","score":0.6008833646774292},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.5905774235725403},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.5826930403709412},{"id":"https://openalex.org/keywords/concurrency","display_name":"Concurrency","score":0.5500973463058472},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.4969344437122345},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.49112650752067566},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.4737582802772522},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.457058846950531},{"id":"https://openalex.org/keywords/graphics-hardware","display_name":"Graphics hardware","score":0.42955300211906433},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.09088775515556335}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8940328359603882},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.6982375979423523},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6307542324066162},{"id":"https://openalex.org/C2779851693","wikidata":"https://www.wikidata.org/wiki/Q183484","display_name":"Graphics processing unit","level":2,"score":0.6008833646774292},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.5905774235725403},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.5826930403709412},{"id":"https://openalex.org/C193702766","wikidata":"https://www.wikidata.org/wiki/Q1414548","display_name":"Concurrency","level":2,"score":0.5500973463058472},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.4969344437122345},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.49112650752067566},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.4737582802772522},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.457058846950531},{"id":"https://openalex.org/C18945957","wikidata":"https://www.wikidata.org/wiki/Q5597193","display_name":"Graphics hardware","level":3,"score":0.42955300211906433},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.09088775515556335},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3303084.3309488","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3303084.3309488","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3303084.3309488","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 10th International Workshop on Programming Models and Applications for Multicores and Manycores","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3303084.3309488","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3303084.3309488","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3303084.3309488","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 10th International Workshop on Programming Models and Applications for Multicores and Manycores","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.6499999761581421,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[{"id":"https://openalex.org/G1072749480","display_name":null,"funder_award_id":"FA9550-17","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"},{"id":"https://openalex.org/G1523888516","display_name":null,"funder_award_id":"FA9550-","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"},{"id":"https://openalex.org/G260750634","display_name":null,"funder_award_id":"FA9550-17-1","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"},{"id":"https://openalex.org/G3258049141","display_name":null,"funder_award_id":"FA9550-17-1-036","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"},{"id":"https://openalex.org/G5809100787","display_name":null,"funder_award_id":"FA9550","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"},{"id":"https://openalex.org/G7515358678","display_name":null,"funder_award_id":"FA9550-17-1-0367","funder_id":"https://openalex.org/F4320338279","funder_display_name":"Air Force Office of Scientific Research"}],"funders":[{"id":"https://openalex.org/F4320338279","display_name":"Air Force Office of Scientific Research","ror":"https://ror.org/011e9bt93"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2916475468.pdf","grobid_xml":"https://content.openalex.org/works/W2916475468.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1624140875","https://openalex.org/W1625255723","https://openalex.org/W1790954942","https://openalex.org/W1982401581","https://openalex.org/W1984222112","https://openalex.org/W2014039063","https://openalex.org/W2028069406","https://openalex.org/W2033451123","https://openalex.org/W2041356909","https://openalex.org/W2080571439","https://openalex.org/W2101209730","https://openalex.org/W2112828875","https://openalex.org/W2138218143","https://openalex.org/W2150593711","https://openalex.org/W2150753219","https://openalex.org/W2153636750","https://openalex.org/W2155503253","https://openalex.org/W2163654949","https://openalex.org/W2168075869","https://openalex.org/W2168596788","https://openalex.org/W2415865954","https://openalex.org/W2513721464","https://openalex.org/W2563372635","https://openalex.org/W2626705819","https://openalex.org/W2794887017","https://openalex.org/W2805118380","https://openalex.org/W4229895907","https://openalex.org/W4230315356","https://openalex.org/W4233147525","https://openalex.org/W4237900079","https://openalex.org/W4240768087"],"related_works":["https://openalex.org/W2151046618","https://openalex.org/W1972148443","https://openalex.org/W1969233021","https://openalex.org/W2167646277","https://openalex.org/W2063573318","https://openalex.org/W2388314963","https://openalex.org/W3158047141","https://openalex.org/W1656096860","https://openalex.org/W2027443981","https://openalex.org/W2063372669"],"abstract_inverted_index":{"Heterogeneous":[0],"devices":[1],"are":[2,39,48],"becoming":[3],"necessary":[4],"components":[5],"of":[6,76,93,108,149],"high":[7,139],"performance":[8],"computing":[9],"infrastructures,":[10],"and":[11,104,125,131,141,151],"the":[12,27,32,52,118,123],"graphics":[13],"processing":[14],"unit":[15],"(GPU)":[16],"plays":[17],"an":[18],"important":[19],"role":[20],"in":[21],"this":[22,77,82],"landscape.":[23],"Given":[24],"a":[25],"problem,":[26],"established":[28],"approach":[29],"for":[30,144],"exploiting":[31],"GPU":[33,71,169],"is":[34,79],"to":[35,51,65,80,97,117,162],"design":[36,58,98],"solutions":[37,47,100,116],"that":[38,68,88,101,114],"parallel,":[40],"without":[41],"data":[42],"or":[43],"flow":[44],"dependencies.":[45],"These":[46],"then":[49],"offloaded":[50],"GPU's":[53],"massively":[54],"parallel":[55,99,126],"capability.":[56],"This":[57],"principle":[59],"(i.e.,":[60],"avoiding":[61],"contention)":[62],"often":[63],"leads":[64],"developing":[66],"applications":[67],"cannot":[69],"maximize":[70],"hardware":[72,109],"utilization.":[73],"The":[74],"goal":[75],"paper":[78],"challenge":[81],"common":[83],"belief":[84],"by":[85,158],"empirically":[86],"showing":[87],"allowing":[89],"even":[90],"simple":[91],"forms":[92],"synchronization":[94],"enables":[95],"programmers":[96],"admit":[102],"conflicts":[103],"achieve":[105],"better":[106],"utilization":[107],"parallelism.":[110],"Our":[111],"experience":[112],"shows":[113],"lock-based":[115],"k-means":[119],"clustering":[120],"problem":[121],"outperform":[122],"well-engineered":[124],"KMCUDA":[127],"on":[128],"both":[129],"synthetic":[130],"real":[132],"datasets;":[133],"averaging":[134],"8.4x":[135],"faster":[136,143],"runtimes":[137],"at":[138],"contention":[140],"8.1x":[142],"low":[145],"contention,":[146],"with":[147],"maximums":[148],"25.4x":[150],"74x,":[152],"respectively.":[153],"We":[154],"summarize":[155],"our":[156],"findings":[157],"identifying":[159],"two":[160],"guidelines":[161],"help":[163],"make":[164],"concurrency":[165],"effective":[166],"when":[167],"programming":[168],"applications.":[170]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
