{"id":"https://openalex.org/W4412480907","doi":"https://doi.org/10.1145/3694906.3743337","title":"Eliminating Bank Conflicts in GPU Mergesort","display_name":"Eliminating Bank Conflicts in GPU Mergesort","publication_year":2025,"publication_date":"2025-07-16","ids":{"openalex":"https://openalex.org/W4412480907","doi":"https://doi.org/10.1145/3694906.3743337"},"language":"en","primary_location":{"id":"doi:10.1145/3694906.3743337","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3694906.3743337","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3694906.3743337","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 37th ACM Symposium on Parallelism in Algorithms and Architectures","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3694906.3743337","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005396551","display_name":"Kyle Berney","orcid":"https://orcid.org/0000-0001-8918-7067"},"institutions":[{"id":"https://openalex.org/I117965899","display_name":"University of Hawai\u02bbi at M\u0101noa","ror":"https://ror.org/01wspgy28","country_code":"US","type":"education","lineage":["https://openalex.org/I117965899"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kyle Berney","raw_affiliation_strings":["University of Hawaii at M\u0101noa, Honolulu, HI, USA"],"raw_orcid":"https://orcid.org/0000-0001-8918-7067","affiliations":[{"raw_affiliation_string":"University of Hawaii at M\u0101noa, Honolulu, HI, USA","institution_ids":["https://openalex.org/I117965899"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015446804","display_name":"Nodari Sitchinava","orcid":"https://orcid.org/0000-0001-8876-4846"},"institutions":[{"id":"https://openalex.org/I117965899","display_name":"University of Hawai\u02bbi at M\u0101noa","ror":"https://ror.org/01wspgy28","country_code":"US","type":"education","lineage":["https://openalex.org/I117965899"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nodari Sitchinava","raw_affiliation_strings":["University of Hawaii at M\u0101noa, Honolulu, HI, USA"],"raw_orcid":"https://orcid.org/0000-0001-8876-4846","affiliations":[{"raw_affiliation_string":"University of Hawaii at M\u0101noa, Honolulu, HI, USA","institution_ids":["https://openalex.org/I117965899"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5005396551"],"corresponding_institution_ids":["https://openalex.org/I117965899"],"apc_list":null,"apc_paid":null,"fwci":1.3517,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.83801839,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"158","last_page":"170"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9653000235557556,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9031999707221985,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6978486180305481},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.42702940106391907}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6978486180305481},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.42702940106391907}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3694906.3743337","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3694906.3743337","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3694906.3743337","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 37th ACM Symposium on Parallelism in Algorithms and Architectures","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3694906.3743337","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3694906.3743337","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3694906.3743337","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 37th ACM Symposium on Parallelism in Algorithms and Architectures","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1201407526","display_name":"AF: Small: Toward A Unified Model of Parallelism And Locality","funder_award_id":"1911245","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5903772271","display_name":"AF: SMALL: Parallel Cache-efficient Data Structures","funder_award_id":"2432018","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6554605010","display_name":null,"funder_award_id":"1911245, 2432018","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"},{"id":"https://openalex.org/G88582782","display_name":null,"funder_award_id":"CCF-1911245","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412480907.pdf","grobid_xml":"https://content.openalex.org/works/W4412480907.grobid-xml"},"referenced_works_count":20,"referenced_works":["https://openalex.org/W1555673550","https://openalex.org/W1974312429","https://openalex.org/W1984164247","https://openalex.org/W1985416860","https://openalex.org/W2038142281","https://openalex.org/W2066015450","https://openalex.org/W2109605977","https://openalex.org/W2117148224","https://openalex.org/W2142193847","https://openalex.org/W2162707967","https://openalex.org/W2415865954","https://openalex.org/W2415973476","https://openalex.org/W2502734103","https://openalex.org/W2725215886","https://openalex.org/W3021786344","https://openalex.org/W3117864297","https://openalex.org/W3164851128","https://openalex.org/W4301891805","https://openalex.org/W4409174475","https://openalex.org/W4412480907"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Graphics":[0],"Processing":[1],"Units":[2],"(GPUs)":[3],"have":[4],"emerged":[5],"as":[6,37,64],"popular":[7],"architectures":[8],"for":[9,55],"high-performance":[10],"computing":[11],"due":[12,29],"to":[13,30],"their":[14],"parallelism":[15,50],"and":[16,51],"low":[17],"latency":[18],"context":[19],"switching":[20],"capabilities.":[21],"However,":[22],"optimizing":[23],"GPU":[24,80],"implementations":[25],"can":[26,67],"be":[27],"challenging":[28],"the":[31,34,38,73],"complexity":[32],"of":[33,41,75,79],"architecture,":[35],"such":[36],"diverse":[39],"characteristics":[40],"memory":[42,53,58],"units.":[43],"While":[44],"most":[45],"optimization":[46],"efforts":[47],"focus":[48],"on":[49],"global":[52],"access,":[54],"some":[56],"algorithms":[57],"conflicts":[59],"in":[60],"shared":[61],"memory,":[62],"known":[63],"bank":[65],"conflicts,":[66],"significantly":[68],"impact":[69],"performance.":[70],"This":[71],"affects":[72],"accuracy":[74],"theoretical":[76],"runtime":[77],"analysis":[78],"algorithms.":[81]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
