{"id":"https://openalex.org/W2990070523","doi":"https://doi.org/10.1109/tpds.2019.2955705","title":"Thread-Level Locking for SIMT Architectures","display_name":"Thread-Level Locking for SIMT Architectures","publication_year":2019,"publication_date":"2019-11-26","ids":{"openalex":"https://openalex.org/W2990070523","doi":"https://doi.org/10.1109/tpds.2019.2955705","mag":"2990070523"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2019.2955705","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2019.2955705","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101688579","display_name":"Lan Gao","orcid":"https://orcid.org/0000-0001-5637-9417"},"institutions":[{"id":"https://openalex.org/I96852419","display_name":"Capital Normal University","ror":"https://ror.org/005edt527","country_code":"CN","type":"education","lineage":["https://openalex.org/I96852419"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lan Gao","raw_affiliation_strings":["Beijing Key Laboratory of Electronic System Reliability and Prognostics, College of Information Engineering, Capital Normal University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Electronic System Reliability and Prognostics, College of Information Engineering, Capital Normal University, Beijing, China","institution_ids":["https://openalex.org/I96852419"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102900140","display_name":"Yunlong Xu","orcid":"https://orcid.org/0000-0003-4727-0676"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunlong Xu","raw_affiliation_strings":["Xi'an Jiaotong University"],"affiliations":[{"raw_affiliation_string":"Xi'an Jiaotong University","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431390","display_name":"Rui Wang","orcid":"https://orcid.org/0000-0003-2741-6033"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Wang","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074183877","display_name":"Zhongzhi Luan","orcid":"https://orcid.org/0000-0002-7186-0556"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhongzhi Luan","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048614443","display_name":"Zhibin Yu","orcid":"https://orcid.org/0000-0001-8067-9612"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhibin Yu","raw_affiliation_strings":["Chinese Academy of Sciences, Shenzhen Institutes of Advanced Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Shenzhen Institutes of Advanced Technology, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079362609","display_name":"Depei Qian","orcid":"https://orcid.org/0000-0002-5382-1473"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Depei Qian","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101688579"],"corresponding_institution_ids":["https://openalex.org/I96852419"],"apc_list":null,"apc_paid":null,"fwci":0.4815,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.62927211,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"31","issue":"5","first_page":"1121","last_page":"1136"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.797917366027832},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.747933030128479},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6476792097091675},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2390030026435852}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.797917366027832},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.747933030128479},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6476792097091675},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2390030026435852}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2019.2955705","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2019.2955705","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3695495462","display_name":null,"funder_award_id":"Z181100006218093","funder_id":"https://openalex.org/F4320334978","funder_display_name":"Beijing Nova Program"},{"id":"https://openalex.org/G4853972368","display_name":null,"funder_award_id":"61772350","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5903059524","display_name":null,"funder_award_id":"61672511","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6122643609","display_name":null,"funder_award_id":"KYJJ2018008","funder_id":"https://openalex.org/F4320327539","funder_display_name":"Beijing Innovation Center for Future Chip"},{"id":"https://openalex.org/G6322973505","display_name":null,"funder_award_id":"61732002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6385625218","display_name":null,"funder_award_id":"61702495","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320327539","display_name":"Beijing Innovation Center for Future Chip","ror":null},{"id":"https://openalex.org/F4320334978","display_name":"Beijing Nova Program","ror":"https://ror.org/034k14f91"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W164384110","https://openalex.org/W1715366078","https://openalex.org/W1826955156","https://openalex.org/W1969549682","https://openalex.org/W1974165977","https://openalex.org/W1981393723","https://openalex.org/W1985229168","https://openalex.org/W2039767911","https://openalex.org/W2048441570","https://openalex.org/W2101209730","https://openalex.org/W2101397060","https://openalex.org/W2117689653","https://openalex.org/W2122106801","https://openalex.org/W2138218143","https://openalex.org/W2150851481","https://openalex.org/W2163654949","https://openalex.org/W2165116875","https://openalex.org/W2227386419","https://openalex.org/W2254317906","https://openalex.org/W2335340700","https://openalex.org/W2409690919","https://openalex.org/W2415865954","https://openalex.org/W2545744347","https://openalex.org/W2563372635","https://openalex.org/W2611473431","https://openalex.org/W2736285633","https://openalex.org/W2751581470","https://openalex.org/W2769311538","https://openalex.org/W2783144320","https://openalex.org/W2794802501","https://openalex.org/W2794887017","https://openalex.org/W3144200734","https://openalex.org/W4238433345","https://openalex.org/W4239826705","https://openalex.org/W4245867598","https://openalex.org/W6637912555","https://openalex.org/W6689509850","https://openalex.org/W6691725984","https://openalex.org/W6748055782"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2023832055","https://openalex.org/W2082485924"],"abstract_inverted_index":{"As":[0],"more":[1],"emerging":[2],"applications":[3],"are":[4],"moving":[5],"to":[6,30,38,60,67,110,168,193],"GPUs,":[7],"thread-level":[8,23,40,52,92],"synchronization":[9,36,41,53,146,218],"has":[10],"become":[11],"a":[12,50,91,162,175,239],"requirement.":[13],"However,":[14],"GPUs":[15,59],"only":[16],"provide":[17],"warp-level":[18],"and":[19,77,102,130,165,205,233],"thread-block-level":[20],"rather":[21],"than":[22],"synchronization.":[24],"Moreover,":[25,179],"it":[26,86,109,180],"is":[27],"highly":[28],"possible":[29],"cause":[31],"live-locks":[32],"by":[33,84,156,230,248],"using":[34],"CPU":[35,131,235,243],"mechanisms":[37],"implement":[39,68,111],"for":[42,58,96,147],"GPUs.":[43,98],"In":[44,223],"this":[45],"article,":[46],"we":[47,89,107],"first":[48],"propose":[49],"software-based":[51],"mechanism":[54],"called":[55],"lock":[56,70],"stealing":[57,71],"avoid":[61],"live-locks.":[62],"We":[63,116],"then":[64],"describe":[65],"how":[66],"our":[69],"algorithm":[72],"in":[73],"mutual":[74],"exclusive":[75],"locks":[76,79],"readers-writer":[78],"with":[80,142,200,209,214,244],"high":[81],"performance.":[82],"Finally,":[83],"putting":[85],"all":[87],"together,":[88],"develop":[90],"locking":[93],"library":[94],"(TLLL)":[95],"commercial":[97],"To":[99],"evaluate":[100],"TLLL":[101,118,152,225],"show":[103,139],"its":[104],"general":[105],"applicability,":[106],"use":[108],"six":[112],"widely":[113],"used":[114],"programs.":[115],"compare":[117],"against":[119],"the":[120,143,154,183,197,201,206,210,216,227,234],"state-of-the-art":[121],"ad-hoc":[122,144,217],"GPU":[123,125,145,199,208,228],"synchronization,":[124],"software":[126],"transactional":[127,133],"memory":[128,134,185,189],"(STM),":[129],"hardware":[132,246],"(HTM),":[135],"respectively.":[136],"The":[137],"results":[138],"that,":[140],"compared":[141],"Delaunay":[148],"mesh":[149,203,212],"refinement":[150],"(DMR),":[151],"improves":[153],"performance":[155,172],"22":[157],"percent":[158,170,250],"on":[159,161,174,196,238,251],"average":[160],"GTX970":[163,198],"GPU,":[164],"shows":[166],"up":[167],"11":[169],"of":[171],"improvement":[173],"Volta":[176],"V100":[177,207],"GPU.":[178],"significantly":[181],"reduces":[182],"required":[184],"size.":[186],"Such":[187],"low":[188],"consumption":[190],"enables":[191],"DMR":[192],"successfully":[194],"run":[195,221],"10-million":[202],"size,":[204,213],"40-million":[211],"which":[215],"can":[219],"not":[220],"successfully.":[222],"addition,":[224],"outperforms":[226],"STM":[229],"65":[231],"percent,":[232],"HTM":[236],"(running":[237],"Xeon":[240],"E5-2620":[241],"v4":[242],"16":[245],"threads)":[247],"43":[249],"average.":[252]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
