{"id":"https://openalex.org/W4406164024","doi":"https://doi.org/10.1109/scw63240.2024.00032","title":"Compiler-Aided Correctness Checking of CUDA-Aware MPI Applications","display_name":"Compiler-Aided Correctness Checking of CUDA-Aware MPI Applications","publication_year":2024,"publication_date":"2024-11-17","ids":{"openalex":"https://openalex.org/W4406164024","doi":"https://doi.org/10.1109/scw63240.2024.00032"},"language":"en","primary_location":{"id":"doi:10.1109/scw63240.2024.00032","is_oa":false,"landing_page_url":"https://doi.org/10.1109/scw63240.2024.00032","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SC24-W: Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058127608","display_name":"Alexander H\u00fcck","orcid":"https://orcid.org/0000-0003-1931-773X"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Alexander H\u00fcck","raw_affiliation_strings":["Technical University Darmstadt,Darmstadt,Germany"],"affiliations":[{"raw_affiliation_string":"Technical University Darmstadt,Darmstadt,Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115807672","display_name":"Tim Ziegler","orcid":"https://orcid.org/0000-0002-8720-0181"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tim Ziegler","raw_affiliation_strings":["Technical University Darmstadt,Darmstadt,Germany"],"affiliations":[{"raw_affiliation_string":"Technical University Darmstadt,Darmstadt,Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065295830","display_name":"Simon Schwitanski","orcid":"https://orcid.org/0000-0001-7121-7205"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon Schwitanski","raw_affiliation_strings":["RWTH Aachen University,Aachen,Germany"],"affiliations":[{"raw_affiliation_string":"RWTH Aachen University,Aachen,Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044273470","display_name":"Joachim Jenke","orcid":"https://orcid.org/0000-0003-0640-8966"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Joachim Jenke","raw_affiliation_strings":["RWTH Aachen University,Aachen,Germany"],"affiliations":[{"raw_affiliation_string":"RWTH Aachen University,Aachen,Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020597086","display_name":"Christian Bischof","orcid":"https://orcid.org/0000-0003-2711-3032"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christian Bischof","raw_affiliation_strings":["Technical University Darmstadt,Darmstadt,Germany"],"affiliations":[{"raw_affiliation_string":"Technical University Darmstadt,Darmstadt,Germany","institution_ids":["https://openalex.org/I31512782"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5058127608"],"corresponding_institution_ids":["https://openalex.org/I31512782"],"apc_list":null,"apc_paid":null,"fwci":0.5186,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.69116896,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"204","last_page":"213"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11424","display_name":"Security and Verification in Computing","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11005","display_name":"Radiation Effects in Electronics","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.856421709060669},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.808186948299408},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.7818039059638977},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.7420787215232849},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5819071531295776},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.4463905394077301},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.38126862049102783},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.3793092370033264}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.856421709060669},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.808186948299408},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.7818039059638977},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.7420787215232849},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5819071531295776},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4463905394077301},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.38126862049102783},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.3793092370033264}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/scw63240.2024.00032","is_oa":false,"landing_page_url":"https://doi.org/10.1109/scw63240.2024.00032","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SC24-W: Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"},{"id":"pmh:oai:tubiblio.ulb.tu-darmstadt.de:153004","is_oa":false,"landing_page_url":"http://tubiblio.ulb.tu-darmstadt.de/view/person/H=FCck=3AAlexander=3A=3A.html>","pdf_url":null,"source":{"id":"https://openalex.org/S4377196390","display_name":"TUbilio (Technical University of Darmstadt)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I31512782","host_organization_name":"Technische Universit\u00e4t Darmstadt","host_organization_lineage":["https://openalex.org/I31512782"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"NonPeerReviewed"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W16395633","https://openalex.org/W250945742","https://openalex.org/W1565978235","https://openalex.org/W1825216778","https://openalex.org/W2025388037","https://openalex.org/W2025819261","https://openalex.org/W2065383439","https://openalex.org/W2075250402","https://openalex.org/W2273799252","https://openalex.org/W2329547742","https://openalex.org/W2488548811","https://openalex.org/W2786171709","https://openalex.org/W2808284296","https://openalex.org/W2909660786","https://openalex.org/W2913752846","https://openalex.org/W2985025837","https://openalex.org/W3083442288","https://openalex.org/W3113436942","https://openalex.org/W3173970356","https://openalex.org/W3174952775","https://openalex.org/W4200032033","https://openalex.org/W4200631433","https://openalex.org/W4232616607","https://openalex.org/W4283372843","https://openalex.org/W4294008856","https://openalex.org/W4295786404","https://openalex.org/W4320062112","https://openalex.org/W4379537862","https://openalex.org/W4386915045","https://openalex.org/W4388581027","https://openalex.org/W6752636418","https://openalex.org/W7055069235"],"related_works":["https://openalex.org/W4399354997","https://openalex.org/W3008339103","https://openalex.org/W1667647204","https://openalex.org/W2404647514","https://openalex.org/W4252501555","https://openalex.org/W2003848320","https://openalex.org/W2005148983","https://openalex.org/W2012954338","https://openalex.org/W2096672917","https://openalex.org/W2392023973"],"abstract_inverted_index":{"Hybrid":[0],"MPI":[1,35,47,74,95,112],"+":[2],"X":[3],"models,":[4,15],"combining":[5],"the":[6,26,39,131,140],"Message":[7],"Passing":[8],"Interface":[9],"(MPI)":[10],"with":[11,70,86,98],"node-level":[12],"parallel":[13],"programming":[14],"increase":[16],"complexity":[17],"and":[18,41,46,56,63,77],"introduce":[19,50],"additional":[20],"correctness":[21,75,105],"issues.":[22],"This":[23],"work":[24],"addresses":[25],"challenges":[27],"of":[28,44,107,116,122,133],"detecting":[29],"data":[30,82],"races":[31],"in":[32,110],"hybrid":[33],"CUDA-aware":[34,111],"applications":[36],"due":[37],"to":[38,127,139],"asynchronous":[40],"non-blocking":[42],"nature":[43],"CUDA":[45],"APIs.":[48],"We":[49,67],"CuSan,":[51,99],"an":[52],"LLVM":[53],"compiler":[54],"extension,":[55],"runtime":[57,120],"that":[58],"tracks":[59],"CUDA-specific":[60],"concurrency,":[61],"synchronization,":[62],"memory":[64,134],"access":[65],"semantics.":[66],"integrate":[68],"CuSan":[69,123,149],"MUST,":[71],"a":[72,80],"dynamic":[73],"tool,":[76],"ThreadSanitizer":[78],"(TSan),":[79],"thread-level":[81],"race":[83],"detector.":[84],"MUST":[85],"TSan":[87],"can":[88],"already":[89],"detect":[90],"concurrency":[91,108],"issues":[92,109],"for":[93,103],"multi-threaded":[94],"codes.":[96],"Together":[97],"these":[100],"tools":[101],"allow":[102],"comprehensive":[104],"checking":[106],"applications.":[113],"Our":[114],"evaluation":[115],"two":[117],"mini-apps":[118],"reveals":[119],"overhead":[121,144],"ranging":[124],"from":[125],"6\u00d7":[126],"36\u00d7,":[128],"depending":[129],"on":[130],"amount":[132],"tracked":[135],"by":[136],"TSan,":[137],"compared":[138],"uninstrumented":[141],"version.":[142],"Memory":[143],"consistently":[145],"remains":[146],"under":[147],"1.8\u00d7.":[148],"is":[150],"available":[151],"at":[152],"https://github.com/tudasc/cusan.":[153]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-02-26T08:16:20.718346","created_date":"2025-10-10T00:00:00"}
