{"id":"https://openalex.org/W4285021184","doi":"https://doi.org/10.1145/3547301","title":"Adaptive Contention Management for Fine-Grained Synchronization on Commodity GPUs","display_name":"Adaptive Contention Management for Fine-Grained Synchronization on Commodity GPUs","publication_year":2022,"publication_date":"2022-07-11","ids":{"openalex":"https://openalex.org/W4285021184","doi":"https://doi.org/10.1145/3547301"},"language":"en","primary_location":{"id":"doi:10.1145/3547301","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3547301","pdf_url":null,"source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1145/3547301","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101688579","display_name":"Lan Gao","orcid":"https://orcid.org/0000-0001-5637-9417"},"institutions":[{"id":"https://openalex.org/I96852419","display_name":"Capital Normal University","ror":"https://ror.org/005edt527","country_code":"CN","type":"education","lineage":["https://openalex.org/I96852419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lan Gao","raw_affiliation_strings":["Capital Normal University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-5637-9417","affiliations":[{"raw_affiliation_string":"Capital Normal University, Beijing, China","institution_ids":["https://openalex.org/I96852419"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100378697","display_name":"Jing Wang","orcid":"https://orcid.org/0000-0003-3653-7013"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Wang","raw_affiliation_strings":["Renmin University of China, Beijing"],"raw_orcid":"https://orcid.org/0000-0003-3653-7013","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101447392","display_name":"Weigong Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I96852419","display_name":"Capital Normal University","ror":"https://ror.org/005edt527","country_code":"CN","type":"education","lineage":["https://openalex.org/I96852419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weigong Zhang","raw_affiliation_strings":["Capital Normal University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3969-5607","affiliations":[{"raw_affiliation_string":"Capital Normal University, Beijing, China","institution_ids":["https://openalex.org/I96852419"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4666,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.59318996,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"19","issue":"4","first_page":"1","last_page":"21"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9098672866821289},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7076045870780945},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.6993047595024109},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6132955551147461},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4466986060142517},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.340205579996109},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2738557755947113},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.09352678060531616}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9098672866821289},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7076045870780945},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.6993047595024109},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6132955551147461},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4466986060142517},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.340205579996109},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2738557755947113},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.09352678060531616},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3547301","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3547301","pdf_url":null,"source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3547301","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3547301","pdf_url":null,"source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1675130169","https://openalex.org/W1964332568","https://openalex.org/W1968775993","https://openalex.org/W1988800505","https://openalex.org/W2041356909","https://openalex.org/W2047060659","https://openalex.org/W2049875313","https://openalex.org/W2050501247","https://openalex.org/W2053744175","https://openalex.org/W2065771339","https://openalex.org/W2067441262","https://openalex.org/W2079038734","https://openalex.org/W2081583983","https://openalex.org/W2085598418","https://openalex.org/W2090584832","https://openalex.org/W2096661534","https://openalex.org/W2098505406","https://openalex.org/W2099865945","https://openalex.org/W2101209730","https://openalex.org/W2107164729","https://openalex.org/W2122106801","https://openalex.org/W2138218143","https://openalex.org/W2142444503","https://openalex.org/W2151887234","https://openalex.org/W2152956697","https://openalex.org/W2156831150","https://openalex.org/W2163654949","https://openalex.org/W2171399035","https://openalex.org/W2198138176","https://openalex.org/W2235785597","https://openalex.org/W2335340700","https://openalex.org/W2409690919","https://openalex.org/W2415865954","https://openalex.org/W2576829774","https://openalex.org/W2611473431","https://openalex.org/W2626705819","https://openalex.org/W2769311538","https://openalex.org/W2794802501","https://openalex.org/W2794887017","https://openalex.org/W2929410821","https://openalex.org/W2990070523","https://openalex.org/W4239826705"],"related_works":["https://openalex.org/W1509211761","https://openalex.org/W2391299576","https://openalex.org/W2133693067","https://openalex.org/W1531488649","https://openalex.org/W3037767301","https://openalex.org/W1585350690","https://openalex.org/W2366027386","https://openalex.org/W2582456645","https://openalex.org/W2479014312","https://openalex.org/W1583465708"],"abstract_inverted_index":{"As":[0],"more":[1],"emerging":[2],"applications":[3,126],"are":[4],"moving":[5],"to":[6,50,81,101],"GPUs,":[7],"fine-grained":[8,128],"synchronization":[9,24,104],"has":[10],"become":[11],"imperative.":[12],"However,":[13],"their":[14],"performance":[15],"can":[16],"be":[17],"severely":[18],"impaired":[19],"in":[20],"case":[21],"of":[22,37,86,93,110,125],"frequent":[23,103],"failures":[25,105],"caused":[26],"by":[27,152],"high":[28],"data":[29],"contention.":[30],"Differently":[31],"from":[32],"CPUs,":[33],"GPUs":[34,121],"own":[35],"thousands":[36],"hardware":[38,79],"threads":[39,45],"and":[40,76,115,144],"adopt":[41],"single":[42],"instruction":[43],"multiple":[44],"paradigm,":[46],"making":[47],"it":[48],"impractical":[49],"deploy":[51],"the":[52,84,91,108,116,146],"CPU":[53],"contention":[54,98,138],"management":[55,99,139],"mechanisms":[56],"directly":[57],"on":[58,119,134,154],"GPUs.":[59],"In":[60],"this":[61],"article,":[62],"we":[63,95],"design":[64],"a":[65,97,123,141],"Software":[66],"Warp":[67],"Controlling":[68],"Framework":[69],"(SWCF),":[70],"which":[71],"employs":[72],"producer-consumer":[73],"execution":[74,85],"model":[75],"leverages":[77],"GPU":[78,136,148],"barriers":[80],"dynamically":[82],"control":[83],"warps":[87],"at":[88],"runtime.":[89],"On":[90],"basis":[92],"SWCF,":[94],"propose":[96],"strategy":[100,118],"decrease":[102],"while":[106],"avoiding":[107],"over-reducing":[109],"parallelism.":[111],"We":[112],"evaluate":[113],"SWCF":[114],"proposed":[117],"commodity":[120],"using":[122],"set":[124],"with":[127],"synchronization.":[129],"The":[130],"results":[131],"show":[132],"that":[133],"V100":[135],"our":[137],"achieves":[140],"4.7X":[142],"speedup":[143],"outperforms":[145],"conventional":[147],"software":[149],"backoff":[150],"solution":[151],"42%":[153],"average.":[155]},"counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
