{"id":"https://openalex.org/W4393140968","doi":"https://doi.org/10.1109/asp-dac58780.2024.10473955","title":"WER: Maximizing Parallelism of Irregular Graph Applications Through GPU Warp EqualizeR","display_name":"WER: Maximizing Parallelism of Irregular Graph Applications Through GPU Warp EqualizeR","publication_year":2024,"publication_date":"2024-01-22","ids":{"openalex":"https://openalex.org/W4393140968","doi":"https://doi.org/10.1109/asp-dac58780.2024.10473955"},"language":"en","primary_location":{"id":"doi:10.1109/asp-dac58780.2024.10473955","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/asp-dac58780.2024.10473955","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 29th Asia and South Pacific Design Automation Conference (ASP-DAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067971879","display_name":"En-Ming Huang","orcid":"https://orcid.org/0000-0003-2196-2834"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"En-Ming Huang","raw_affiliation_strings":["National Tsing Hua University,Elsa Lab,Department of Computer Science,Hsinchu City,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University,Elsa Lab,Department of Computer Science,Hsinchu City,Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032713461","display_name":"Bo-Wun Cheng","orcid":"https://orcid.org/0000-0001-5756-2301"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Bo-Wun Cheng","raw_affiliation_strings":["National Tsing Hua University,Elsa Lab,Department of Computer Science,Hsinchu City,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University,Elsa Lab,Department of Computer Science,Hsinchu City,Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109908128","display_name":"Meng-Hsien Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Meng-Hsien Lin","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Department of Computer Science,Hsinchu City,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Department of Computer Science,Hsinchu City,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028600832","display_name":"Chun\u2010Yi Lee","orcid":"https://orcid.org/0000-0002-4680-4800"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chun-Yi Lee","raw_affiliation_strings":["National Tsing Hua University,Elsa Lab,Department of Computer Science,Hsinchu City,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University,Elsa Lab,Department of Computer Science,Hsinchu City,Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019259173","display_name":"Tsung Tai Yeh","orcid":"https://orcid.org/0000-0002-2401-9916"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Tsung Tai Yeh","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Department of Computer Science,Hsinchu City,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Department of Computer Science,Hsinchu City,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5067971879"],"corresponding_institution_ids":["https://openalex.org/I25846049"],"apc_list":null,"apc_paid":null,"fwci":0.265,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.47236582,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"201","last_page":"206"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.978600025177002,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.8161944150924683},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8058383464813232},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.5553916692733765},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5233715772628784},{"id":"https://openalex.org/keywords/data-parallelism","display_name":"Data parallelism","score":0.46006524562835693},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.43006718158721924},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2517862319946289}],"concepts":[{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.8161944150924683},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8058383464813232},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.5553916692733765},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5233715772628784},{"id":"https://openalex.org/C61483411","wikidata":"https://www.wikidata.org/wiki/Q3124522","display_name":"Data parallelism","level":3,"score":0.46006524562835693},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.43006718158721924},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2517862319946289}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asp-dac58780.2024.10473955","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/asp-dac58780.2024.10473955","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 29th Asia and South Pacific Design Automation Conference (ASP-DAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320331164","display_name":"National Science and Technology Council","ror":"https://ror.org/00wnb9798"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1994473607","https://openalex.org/W2021211271","https://openalex.org/W2105102111","https://openalex.org/W2295258302","https://openalex.org/W2505199798","https://openalex.org/W2755088640","https://openalex.org/W2790789009","https://openalex.org/W2792834173","https://openalex.org/W2976859544","https://openalex.org/W3102510044","https://openalex.org/W3160477826","https://openalex.org/W3160872503","https://openalex.org/W3201491683","https://openalex.org/W3206857466","https://openalex.org/W4237819810","https://openalex.org/W6792319920"],"related_works":["https://openalex.org/W3213381848","https://openalex.org/W2005148983","https://openalex.org/W2017587301","https://openalex.org/W2012954338","https://openalex.org/W2096672917","https://openalex.org/W2392023973","https://openalex.org/W2939411666","https://openalex.org/W2009169896","https://openalex.org/W4230999561","https://openalex.org/W1595672120"],"abstract_inverted_index":{"Irregular":[0],"graphs":[1,24],"are":[2],"becoming":[3],"increasingly":[4],"prevalent":[5],"across":[6],"a":[7,90,101,113,118,142,156],"broad":[8],"spectrum":[9],"of":[10,22,30,53,70,97,160],"data":[11],"analysis":[12],"applications.":[13],"Despite":[14],"their":[15],"versatility,":[16],"the":[17,28,51,95,138,167],"inherent":[18],"complexity":[19],"and":[20,56,76,112,135,163,170],"irregularity":[21],"these":[23,83],"often":[25],"result":[26],"in":[27,124],"underutilization":[29,45],"Single":[31],"Instruction,":[32],"Multiple":[33],"Data":[34],"(SIMD)":[35],"resources":[36,99,140],"when":[37],"processed":[38],"on":[39,100],"Graphics":[40],"Processing":[41],"Units":[42],"(GPUs).":[43],"This":[44],"originates":[46],"from":[47],"two":[48],"primary":[49],"issues:":[50],"occurrence":[52],"inactive":[54],"threads":[55],"intra-warp":[57],"load":[58],"imbalances.":[59],"These":[60],"issues":[61],"can":[62],"produce":[63],"idle":[64],"threads,":[65],"lead":[66],"to":[67,93,130],"inefficient":[68],"usage":[69],"SIMD":[71,98,132,139],"resources,":[72],"consequently":[73],"hamper":[74],"throughput,":[75],"increase":[77],"program":[78],"execution":[79],"time.":[80],"To":[81],"address":[82],"challenges,":[84],"we":[85],"introduce":[86],"Warp":[87],"EqualizeR":[88],"(WER),":[89],"framework":[91],"designed":[92],"optimize":[94],"utilization":[96,134],"GPU":[102,169],"for":[103],"processing":[104],"irregular":[105,125],"graphs.":[106],"WER":[107,129,154],"employs":[108],"both":[109],"software":[110],"API":[111],"specifically-tailored":[114],"hardware":[115],"microarchitecture.":[116],"Such":[117],"synergistic":[119],"approach":[120],"enables":[121],"workload":[122],"redistribution":[123],"graphs,":[126],"which":[127],"allows":[128],"enhance":[131],"lane":[133],"further":[136],"harness":[137],"within":[141],"GPU.":[143],"Our":[144],"experimental":[145],"results":[146],"over":[147,166],"seven":[148],"different":[149],"graph":[150],"applications":[151],"indicate":[152],"that":[153],"yields":[155],"geometric":[157],"mean":[158],"speedup":[159],"$2.52":[161],"\\times$":[162,165],"$1.47":[164],"baseline":[168],"existing":[171],"state-of-the-art":[172],"methodologies,":[173],"respectively.":[174]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
