{"id":"https://openalex.org/W4410321786","doi":"https://doi.org/10.1145/3725798.3725805","title":"Performance Impact and Trade-Offs for Tuning Key Architectural Parameters on CPU+GPU Systems","display_name":"Performance Impact and Trade-Offs for Tuning Key Architectural Parameters on CPU+GPU Systems","publication_year":2025,"publication_date":"2025-03-01","ids":{"openalex":"https://openalex.org/W4410321786","doi":"https://doi.org/10.1145/3725798.3725805"},"language":"en","primary_location":{"id":"doi:10.1145/3725798.3725805","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3725798.3725805","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725805","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th Workshop on General Purpose Processing Using GPU","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725805","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014340343","display_name":"Kazi Asifuzzaman","orcid":"https://orcid.org/0000-0002-4004-4791"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kazi Asifuzzaman","raw_affiliation_strings":["Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA"],"affiliations":[{"raw_affiliation_string":"Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031971317","display_name":"Narasinga Rao Miniskar","orcid":"https://orcid.org/0000-0001-8259-8891"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Narasinga Rao Miniskar","raw_affiliation_strings":["Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA"],"affiliations":[{"raw_affiliation_string":"Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032103653","display_name":"William F. Godoy","orcid":"https://orcid.org/0000-0002-2590-5178"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William Godoy","raw_affiliation_strings":["Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA"],"affiliations":[{"raw_affiliation_string":"Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071822072","display_name":"\u00d3scar Hern\u00e1ndez","orcid":"https://orcid.org/0000-0002-5380-6951"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Oscar Hernandez","raw_affiliation_strings":["Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA"],"affiliations":[{"raw_affiliation_string":"Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061838490","display_name":"Jeffrey S. Vetter","orcid":"https://orcid.org/0000-0002-2449-6720"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jeffrey S. Vetter","raw_affiliation_strings":["Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA"],"affiliations":[{"raw_affiliation_string":"Oak Ridge National Laboratory, Oak Ridge, Tennessee, USA","institution_ids":["https://openalex.org/I1289243028"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5014340343"],"corresponding_institution_ids":["https://openalex.org/I1289243028"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08298927,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"42","last_page":"47"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.7203959226608276},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6371057629585266},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.46736642718315125},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.389908105134964},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.36798131465911865},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.17794543504714966}],"concepts":[{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.7203959226608276},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6371057629585266},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.46736642718315125},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.389908105134964},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.36798131465911865},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.17794543504714966}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3725798.3725805","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3725798.3725805","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725805","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th Workshop on General Purpose Processing Using GPU","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3725798.3725805","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3725798.3725805","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725805","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th Workshop on General Purpose Processing Using GPU","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1719536385","display_name":null,"funder_award_id":"DE-AC05-00OR22725","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G6403792893","display_name":null,"funder_award_id":"DE-FOA-0002950","funder_id":"https://openalex.org/F4320332359","funder_display_name":"Office of Science"},{"id":"https://openalex.org/G6415871857","display_name":null,"funder_award_id":"DE-FOA-0002950","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G8906985441","display_name":null,"funder_award_id":"00OR22725","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"}],"funders":[{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320306250","display_name":"Battelle","ror":"https://ror.org/01h5tnr73"},{"id":"https://openalex.org/F4320332359","display_name":"Office of Science","ror":"https://ror.org/00mmn6b08"},{"id":"https://openalex.org/F4320337506","display_name":"Advanced Scientific Computing Research","ror":"https://ror.org/0012c7r22"},{"id":"https://openalex.org/F4320338287","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4410321786.pdf","grobid_xml":"https://content.openalex.org/works/W4410321786.grobid-xml"},"referenced_works_count":12,"referenced_works":["https://openalex.org/W1979527452","https://openalex.org/W2103742924","https://openalex.org/W2106562406","https://openalex.org/W2110195531","https://openalex.org/W2622164283","https://openalex.org/W2787181861","https://openalex.org/W3012233231","https://openalex.org/W3102510044","https://openalex.org/W3102618228","https://openalex.org/W3159534764","https://openalex.org/W4246036875","https://openalex.org/W4327911463"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3],"performed":[4],"an":[5,11],"initial":[6],"design":[7,61],"space":[8],"exploration":[9],"of":[10,59,67,75,136],"accelerated":[12],"processing":[13],"unit":[14],"(APU)-a":[15],"hybrid":[16],"CPU+GPU":[17],"architecture":[18],"that":[19,98],"integrates":[20],"both":[21],"compute":[22],"units":[23],"(CUs)":[24],"and":[25,40,48,69,91,108,111,129,146],"memory":[26,38,52,71,87,131,147],"into":[27],"a":[28,114],"unified":[29],"system.This":[30],"integration":[31],"aims":[32],"to":[33,50,102,138],"reduce":[34],"data":[35,89,144],"movement,":[36,145],"enhance":[37],"locality,":[39],"improve":[41],"energy":[42],"efficiency":[43],"by":[44,121],"enabling":[45],"the":[46,57,65,73,82,134],"CPU":[47],"GPU":[49],"share":[51],"directly.This":[53],"effort":[54],"focused":[55],"on":[56,86],"interplay":[58],"key":[60],"components-cache":[62],"line":[63],"size,":[64],"number":[66],"CUs,":[68],"main":[70],"technology-and":[72],"trade-offs":[74],"each":[76],"configuration":[77],"were":[78],"analyzed.This":[79],"paper":[80],"highlights":[81],"various":[83],"configurations'":[84],"impact":[85],"accesses,":[88],"reuse,":[90],"power":[92,148],"utilization.The":[93],"results":[94],"provide":[95],"valuable":[96],"insights":[97],"can":[99,118],"be":[100,119],"leveraged":[101],"optimize":[103],"APU":[104],"architectures":[105],"for":[106],"high-performance":[107],"energy-efficient":[109],"computing":[110],"thus":[112],"create":[113],"balanced":[115],"architecture.This":[116],"optimization":[117],"achieved":[120],"adopting":[122],"dynamic":[123],"cache":[124],"management,":[125],"runtime":[126],"CU":[127],"scaling,":[128],"advanced":[130],"integration,":[132],"highlighting":[133],"potential":[135],"APUs":[137],"address":[139],"critical":[140],"challenges":[141],"in":[142],"compute,":[143],"consumption.":[149]},"counts_by_year":[],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
