{"id":"https://openalex.org/W3206908800","doi":"https://doi.org/10.1145/3470644","title":"Pointer-Based Divergence Analysis for OpenCL 2.0 Programs","display_name":"Pointer-Based Divergence Analysis for OpenCL 2.0 Programs","publication_year":2021,"publication_date":"2021-10-15","ids":{"openalex":"https://openalex.org/W3206908800","doi":"https://doi.org/10.1145/3470644","mag":"3206908800"},"language":"en","primary_location":{"id":"doi:10.1145/3470644","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3470644","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037552091","display_name":"Shao-Chung Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shao-Chung Wang","raw_affiliation_strings":["National Tsing Hua University, Hsinchu, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024338470","display_name":"Lin-Ya Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Lin-Ya Yu","raw_affiliation_strings":["National Tsing Hua University, Hsinchu, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053774690","display_name":"Li-An Her","orcid":null},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Li-An Her","raw_affiliation_strings":["National Tsing Hua University, Hsinchu, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041551416","display_name":"Yuan\u2010Shin Hwang","orcid":null},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yuan-Shin Hwang","raw_affiliation_strings":["National Taiwan University of Science and Technology, Taipei, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taiwan University of Science and Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038803698","display_name":"Jenq\u2010Kuen Lee","orcid":"https://orcid.org/0000-0001-9919-6258"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jenq-Kuen Lee","raw_affiliation_strings":["National Tsing Hua University, Hsinchu, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.8878,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.85865237,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":"8","issue":"4","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8651821613311768},{"id":"https://openalex.org/keywords/pointer","display_name":"Pointer (user interface)","score":0.7509758472442627},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7502642869949341},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.7465384006500244},{"id":"https://openalex.org/keywords/pointer-analysis","display_name":"Pointer analysis","score":0.5271719694137573},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.5239605903625488},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.5229806900024414},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4642791152000427},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.42534857988357544},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.39899611473083496},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3425227999687195},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.29002952575683594},{"id":"https://openalex.org/keywords/static-analysis","display_name":"Static analysis","score":0.260733962059021},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.08068925142288208}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8651821613311768},{"id":"https://openalex.org/C150202949","wikidata":"https://www.wikidata.org/wiki/Q107602","display_name":"Pointer (user interface)","level":2,"score":0.7509758472442627},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7502642869949341},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.7465384006500244},{"id":"https://openalex.org/C7263679","wikidata":"https://www.wikidata.org/wiki/Q5978076","display_name":"Pointer analysis","level":3,"score":0.5271719694137573},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.5239605903625488},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.5229806900024414},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4642791152000427},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.42534857988357544},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.39899611473083496},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3425227999687195},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.29002952575683594},{"id":"https://openalex.org/C97686452","wikidata":"https://www.wikidata.org/wiki/Q7604153","display_name":"Static analysis","level":2,"score":0.260733962059021},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.08068925142288208},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3470644","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3470644","pdf_url":null,"source":{"id":"https://openalex.org/S2483380313","display_name":"ACM Transactions on Parallel Computing","issn_l":"2329-4949","issn":["2329-4949","2329-4957"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Parallel Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322410","display_name":"MediaTek","ror":"https://ror.org/05g9jck81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W38257615","https://openalex.org/W220935706","https://openalex.org/W1483717008","https://openalex.org/W1870686413","https://openalex.org/W1954658694","https://openalex.org/W1982205631","https://openalex.org/W1985372145","https://openalex.org/W1990087033","https://openalex.org/W1992851788","https://openalex.org/W1994316441","https://openalex.org/W1995268554","https://openalex.org/W2002771912","https://openalex.org/W2010452422","https://openalex.org/W2012630996","https://openalex.org/W2013247896","https://openalex.org/W2014030893","https://openalex.org/W2080592089","https://openalex.org/W2089482246","https://openalex.org/W2101430044","https://openalex.org/W2124556751","https://openalex.org/W2128329055","https://openalex.org/W2134705409","https://openalex.org/W2143798346","https://openalex.org/W2147654959","https://openalex.org/W2153185479","https://openalex.org/W2156540297","https://openalex.org/W2156831150","https://openalex.org/W2167675119","https://openalex.org/W2169880332","https://openalex.org/W2222659926","https://openalex.org/W2240827923","https://openalex.org/W2262439752","https://openalex.org/W2521014836","https://openalex.org/W2767882261","https://openalex.org/W2780934147","https://openalex.org/W2798404616","https://openalex.org/W3003065932","https://openalex.org/W3013258932","https://openalex.org/W3013490664","https://openalex.org/W3013976982","https://openalex.org/W3138798301","https://openalex.org/W4240331105"],"related_works":["https://openalex.org/W2553375745","https://openalex.org/W2363386825","https://openalex.org/W2188526093","https://openalex.org/W1996094959","https://openalex.org/W2999115679","https://openalex.org/W2370320024","https://openalex.org/W3147482974","https://openalex.org/W2111180768","https://openalex.org/W2362627649","https://openalex.org/W2260512874"],"abstract_inverted_index":{"A":[0,82],"modern":[1],"GPU":[2,43],"is":[3,33,45,121,150,195,311,322],"designed":[4],"with":[5,49,74,225,228,242,296],"many":[6],"large":[7],"thread":[8],"groups":[9],"to":[10,35,153,218],"achieve":[11],"a":[12,40,50,107,155,229,316,320],"high":[13,51],"throughput":[14],"and":[15,71,80,88,96,129,134,139,170,214,247,275,293,299,325],"performance.":[16],"Within":[17],"these":[18],"groups,":[19],"the":[20,30,75,112,163,168,178,185,189,261,266,270,278,283,308,326],"threads":[21],"are":[22],"grouped":[23],"into":[24],"fixed-size":[25],"SIMD":[26],"batches":[27],"in":[28,39,210,237,268,318],"which":[29,149,269,319],"same":[31],"instruction":[32],"applied":[34,217],"vectors":[36],"of":[37,53,162,167,177,188,234,254,286],"data":[38,54],"lockstep.":[41],"This":[42],"architecture":[44],"suitable":[46],"for":[47,66,115,198,260,265,277],"applications":[48],"degree":[52],"parallelism,":[55],"but":[56],"its":[57],"performance":[58],"degrades":[59],"seriously":[60],"when":[61],"divergence":[62,67,76,94,113,156,172,175,186,190],"occurs.":[63],"Many":[64],"optimizations":[65],"have":[68],"been":[69],"proposed,":[70],"they":[72],"vary":[73],"information":[77,114],"about":[78],"variables":[79,288],"branches.":[81,302],"previous":[83],"analysis":[84],"scheme":[85,109,144,194,207,267,310,317],"viewed":[86],"pointers":[87,169,179,256],"return":[89],"values":[90],"from":[91,136],"functions":[92,133],"as":[93],"directly,":[95],"only":[97],"focused":[98],"on":[99,123],"OpenCL":[100,117,219],"1.x.":[101],"In":[102],"this":[103],"article,":[104],"we":[105],"present":[106],"novel":[108],"that":[110,159,307],"reports":[111],"pointer-intensive":[116],"programs.":[118,220],"The":[119,142,174,193,205,251],"approach":[120],"based":[122],"extended":[124,147,197],"static":[125],"single":[126],"assignment":[127],"(SSA)":[128],"adds":[130],"some":[131],"special":[132],"annotations":[135],"memory":[137],"SSA":[138],"gated":[140],"SSA.":[141],"proposed":[143,206,262,309],"first":[145],"constructs":[146],"SSA,":[148],"then":[151],"used":[152],"build":[154],"relation":[157,191],"graph":[158],"includes":[160],"all":[161],"possible":[164],"points-to":[165],"relationships":[166],"initialized":[171],"states.":[173],"state":[176,187],"can":[180,215],"be":[181,216],"determined":[182],"by":[183,201],"propagating":[184],"graph.":[192],"further":[196],"interprocedural":[199],"cases":[200],"considering":[202],"function-related":[203],"statements.":[204,250],"was":[208,258,272],"implemented":[209],"an":[211,238],"LLVM":[212,239,280,328],"compiler":[213],"We":[221],"analyzed":[222,231],"10":[223],"programs":[224],"24":[226],"kernels,":[227],"total":[230,252,284],"program":[232],"size":[233],"1,306":[235],"instructions":[236],"intermediate":[240],"representation,":[241],"885":[243],"variables,":[244],"108":[245],"branches,":[246],"313":[248],"pointer-related":[249],"number":[253],"divergent":[255,287,301,324],"detected":[257,289],"146":[259],"scheme,":[263],"200":[264],"pointer":[271,321],"always":[273,323],"divergent,":[274],"155":[276],"current":[279,327],"default":[281,329],"scheme;":[282],"numbers":[285],"were":[290],"458,":[291],"519,":[292],"482,":[294],"respectively,":[295],"31,":[297],"34,":[298],"32":[300],"These":[303],"experimental":[304],"results":[305],"indicate":[306],"more":[312],"precise":[313],"than":[314],"both":[315],"scheme.":[330]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
