{"id":"https://openalex.org/W2798640261","doi":"https://doi.org/10.1145/3192366.3192368","title":"CURD: a dynamic CUDA race detector","display_name":"CURD: a dynamic CUDA race detector","publication_year":2018,"publication_date":"2018-06-11","ids":{"openalex":"https://openalex.org/W2798640261","doi":"https://doi.org/10.1145/3192366.3192368","mag":"2798640261"},"language":"en","primary_location":{"id":"doi:10.1145/3192366.3192368","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3192366.3192368","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3192366.3192368","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th ACM SIGPLAN Conference on Programming Language Design and Implementation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3192366.3192368","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022471948","display_name":"Yuanfeng Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I36788626","display_name":"California University of Pennsylvania","ror":"https://ror.org/01spssf70","country_code":"US","type":"education","lineage":["https://openalex.org/I36788626"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yuanfeng Peng","raw_affiliation_strings":["University of Pennsylvania, USA"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania, USA","institution_ids":["https://openalex.org/I36788626"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077691647","display_name":"Vinod Grover","orcid":null},"institutions":[{"id":"https://openalex.org/I4210127875","display_name":"Nvidia (United States)","ror":"https://ror.org/03jdj4y14","country_code":"US","type":"company","lineage":["https://openalex.org/I4210127875"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vinod Grover","raw_affiliation_strings":["NVIDIA, USA"],"affiliations":[{"raw_affiliation_string":"NVIDIA, USA","institution_ids":["https://openalex.org/I4210127875"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031917049","display_name":"Joseph Devietti","orcid":"https://orcid.org/0000-0002-9330-7233"},"institutions":[{"id":"https://openalex.org/I36788626","display_name":"California University of Pennsylvania","ror":"https://ror.org/01spssf70","country_code":"US","type":"education","lineage":["https://openalex.org/I36788626"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Joseph Devietti","raw_affiliation_strings":["University of Pennsylvania, USA"],"affiliations":[{"raw_affiliation_string":"University of Pennsylvania, USA","institution_ids":["https://openalex.org/I36788626"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5022471948"],"corresponding_institution_ids":["https://openalex.org/I36788626"],"apc_list":null,"apc_paid":null,"fwci":2.7772,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.90552432,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"390","last_page":"403"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.821248471736908},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.8074763417243958},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7713059186935425},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.7291715145111084},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6190732717514038},{"id":"https://openalex.org/keywords/debugging","display_name":"Debugging","score":0.541049599647522},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.43149787187576294},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2496648132801056}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.821248471736908},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.8074763417243958},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7713059186935425},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.7291715145111084},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6190732717514038},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.541049599647522},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.43149787187576294},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2496648132801056},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3192366.3192368","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3192366.3192368","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3192366.3192368","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th ACM SIGPLAN Conference on Programming Language Design and Implementation","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3192366.3192368","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3192366.3192368","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3192366.3192368","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th ACM SIGPLAN Conference on Programming Language Design and Implementation","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1713430219","display_name":null,"funder_award_id":"XPS-1337174","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2798640261.pdf","grobid_xml":"https://content.openalex.org/works/W2798640261.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W5651039","https://openalex.org/W1487375638","https://openalex.org/W1817344819","https://openalex.org/W1866093455","https://openalex.org/W1971463841","https://openalex.org/W1972544179","https://openalex.org/W1972663160","https://openalex.org/W1979114612","https://openalex.org/W2022457591","https://openalex.org/W2025819261","https://openalex.org/W2041470524","https://openalex.org/W2043003055","https://openalex.org/W2061239425","https://openalex.org/W2072419942","https://openalex.org/W2076960126","https://openalex.org/W2078197548","https://openalex.org/W2080592089","https://openalex.org/W2093753124","https://openalex.org/W2105391037","https://openalex.org/W2105794846","https://openalex.org/W2110592167","https://openalex.org/W2115968584","https://openalex.org/W2117444998","https://openalex.org/W2121717408","https://openalex.org/W2121816623","https://openalex.org/W2149538119","https://openalex.org/W2150602145","https://openalex.org/W2153174073","https://openalex.org/W2156138494","https://openalex.org/W2156831150","https://openalex.org/W2167744164","https://openalex.org/W2167995056","https://openalex.org/W2169880332","https://openalex.org/W2170200862","https://openalex.org/W2199020522","https://openalex.org/W2234512370","https://openalex.org/W2273440736","https://openalex.org/W2556205142","https://openalex.org/W2589311469","https://openalex.org/W2731956051","https://openalex.org/W2951135776","https://openalex.org/W4248655060"],"related_works":["https://openalex.org/W3194833114","https://openalex.org/W4205868343","https://openalex.org/W66594024","https://openalex.org/W2011840458","https://openalex.org/W3213381848","https://openalex.org/W2017587301","https://openalex.org/W2005148983","https://openalex.org/W2030707850","https://openalex.org/W3038415719","https://openalex.org/W2244094767"],"abstract_inverted_index":{"As":[0],"GPUs":[1],"have":[2],"become":[3,15],"an":[4,119,150],"integral":[5],"part":[6],"of":[7,23,26,61,93,154,176],"nearly":[8],"every":[9],"pro-":[10,79],"cessor,":[11],"GPU":[12,18,78],"programming":[13,19],"has":[14],"increasingly":[16],"popular.":[17],"requires":[20],"a":[21,66,90,130,172],"combination":[22],"extreme":[24],"levels":[25],"parallelism":[27],"and":[28,51,115,132,191],"low-level":[29],"programming,":[30],"making":[31],"it":[32],"easy":[33],"for":[34],"concurrency":[35],"bugs":[36,46,186],"such":[37],"as":[38],"data":[39,75,94,109],"races":[40,76,95,110,181],"to":[41,54,57,73,100,137],"arise.":[42],"These":[43],"con-":[44],"currency":[45],"can":[47,107],"be":[48],"extremely":[49],"subtle":[50],"di":[52],"cult":[53],"debug":[55],"due":[56],"the":[58,126],"massive":[59],"numbers":[60],"threads":[62],"running":[63],"concurrently":[64],"on":[65,89,112,125],"modern":[67],"GPU.":[68],"While":[69],"some":[70],"tools":[71],"exist":[72],"detect":[74,108],"in":[77,96,129,187,192],"grams,":[80],"they":[81],"are":[82],"often":[83],"prohibitively":[84],"slow":[85],"or":[86],"focused":[87],"only":[88],"small":[91],"class":[92,175],"shared":[97,114],"memory.":[98],"Compared":[99],"prior":[101],"work,":[102],"our":[103,183],"race":[104,121,167],"detector,":[105,168],"CURD,":[106],"precisely":[111],"both":[113],"global":[116],"memory,":[117],"selects":[118],"appropriate":[120],"detection":[122],"algorithm":[123],"based":[124],"synchronization":[127],"used":[128],"program,":[131],"utilizes":[133],"efficient":[134],"compiler":[135],"instrumentation":[136],"reduce":[138],"performance":[139],"overheads.":[140],"Across":[141],"53":[142],"benchmarks,":[143,184],"we":[144],"find":[145],"that":[146],"using":[147],"CURD":[148,160,178],"incurs":[149],"aver-":[151],"age":[152],"slowdown":[153],"just":[155],"2.88x":[156],"over":[157],"native":[158],"execution.":[159],"is":[161],"2.1x":[162],"faster":[163],"than":[164],"Nvidia\u2019s":[165],"CUDA-Racecheck":[166],"de-":[169],"spite":[170],"detecting":[171],"much":[173],"broader":[174],"races.":[177],"finds":[179],"35":[180],"across":[182],"including":[185],"established":[188],"benchmark":[189],"suites":[190],"sample":[193],"programs":[194],"from":[195],"Nvidia.":[196]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
