{"id":"https://openalex.org/W4416203799","doi":"https://doi.org/10.1145/3712285.3759768","title":"Characterizing Performance, Power, and Energy of AMD CDNA3 GPU Family","display_name":"Characterizing Performance, Power, and Energy of AMD CDNA3 GPU Family","publication_year":2025,"publication_date":"2025-11-12","ids":{"openalex":"https://openalex.org/W4416203799","doi":"https://doi.org/10.1145/3712285.3759768"},"language":null,"primary_location":{"id":"doi:10.1145/3712285.3759768","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3712285.3759768","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019583227","display_name":"Bagus Hanindhito","orcid":"https://orcid.org/0000-0002-8485-581X"},"institutions":[{"id":"https://openalex.org/I4210149435","display_name":"DELL (United States)","ror":"https://ror.org/05rejmm18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210149435"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Bagus Hanindhito","raw_affiliation_strings":["Dell Technologies, Round Rock, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Dell Technologies, Round Rock, Texas, USA","institution_ids":["https://openalex.org/I4210149435"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064303476","display_name":"B. M. Patel","orcid":"https://orcid.org/0009-0007-8166-5686"},"institutions":[{"id":"https://openalex.org/I4210149435","display_name":"DELL (United States)","ror":"https://ror.org/05rejmm18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210149435"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bhavesh Patel","raw_affiliation_strings":["Dell Technologies, Round Rock, Texas, USA"],"affiliations":[{"raw_affiliation_string":"Dell Technologies, Round Rock, Texas, USA","institution_ids":["https://openalex.org/I4210149435"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5019583227"],"corresponding_institution_ids":["https://openalex.org/I4210149435"],"apc_list":null,"apc_paid":null,"fwci":2.2703,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.90411102,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"905","last_page":"934"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.39899998903274536,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.39899998903274536,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.19830000400543213,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.05380000174045563,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.6488000154495239},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5081999897956848},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics","score":0.46399998664855957},{"id":"https://openalex.org/keywords/graphics-processing-unit","display_name":"Graphics processing unit","score":0.46129998564720154},{"id":"https://openalex.org/keywords/coprocessor","display_name":"Coprocessor","score":0.4595000147819519},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.45260000228881836},{"id":"https://openalex.org/keywords/graphics-hardware","display_name":"Graphics hardware","score":0.37779998779296875},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.375900000333786},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.3718999922275543}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7325999736785889},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.6488000154495239},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.6126999855041504},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5081999897956848},{"id":"https://openalex.org/C77660652","wikidata":"https://www.wikidata.org/wiki/Q150971","display_name":"Computer graphics","level":2,"score":0.46399998664855957},{"id":"https://openalex.org/C2779851693","wikidata":"https://www.wikidata.org/wiki/Q183484","display_name":"Graphics processing unit","level":2,"score":0.46129998564720154},{"id":"https://openalex.org/C86111242","wikidata":"https://www.wikidata.org/wiki/Q859595","display_name":"Coprocessor","level":2,"score":0.4595000147819519},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.45260000228881836},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4178999960422516},{"id":"https://openalex.org/C18945957","wikidata":"https://www.wikidata.org/wiki/Q5597193","display_name":"Graphics hardware","level":3,"score":0.37779998779296875},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.375900000333786},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.3718999922275543},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.36629998683929443},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.3555999994277954},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.3125999867916107},{"id":"https://openalex.org/C2985973956","wikidata":"https://www.wikidata.org/wiki/Q1617745","display_name":"High energy","level":2,"score":0.2888000011444092},{"id":"https://openalex.org/C106515295","wikidata":"https://www.wikidata.org/wiki/Q26806595","display_name":"Parallel processing","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C2989164559","wikidata":"https://www.wikidata.org/wiki/Q15637420","display_name":"Low energy","level":2,"score":0.2784999907016754},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.27799999713897705},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.2766999900341034},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.27559998631477356},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.27410000562667847},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.25999999046325684},{"id":"https://openalex.org/C2778305236","wikidata":"https://www.wikidata.org/wiki/Q178570","display_name":"OpenGL","level":3,"score":0.25850000977516174},{"id":"https://openalex.org/C537207887","wikidata":"https://www.wikidata.org/wiki/Q2816483","display_name":"Real-time computer graphics","level":4,"score":0.25760000944137573},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C2985918086","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel architecture","level":3,"score":0.2533999979496002}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3712285.3759768","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3712285.3759768","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W858404628","https://openalex.org/W1031578623","https://openalex.org/W1133087070","https://openalex.org/W1964588245","https://openalex.org/W1974697321","https://openalex.org/W2005639572","https://openalex.org/W2027154929","https://openalex.org/W2039042415","https://openalex.org/W2067174909","https://openalex.org/W2078637295","https://openalex.org/W2093307449","https://openalex.org/W2128438553","https://openalex.org/W2141579716","https://openalex.org/W2155503253","https://openalex.org/W2165831368","https://openalex.org/W2169631286","https://openalex.org/W2171268876","https://openalex.org/W2174937805","https://openalex.org/W2617819327","https://openalex.org/W2791204867","https://openalex.org/W2791673912","https://openalex.org/W2794424798","https://openalex.org/W2906611591","https://openalex.org/W2913790721","https://openalex.org/W2964806098","https://openalex.org/W3035762603","https://openalex.org/W3036255981","https://openalex.org/W3082020764","https://openalex.org/W3091995851","https://openalex.org/W3138700303","https://openalex.org/W3158790368","https://openalex.org/W3185294035","https://openalex.org/W3205833606","https://openalex.org/W3217045543","https://openalex.org/W4220980777","https://openalex.org/W4221037885","https://openalex.org/W4244886992","https://openalex.org/W4282959339","https://openalex.org/W4283157303","https://openalex.org/W4297325261","https://openalex.org/W4309672181","https://openalex.org/W4311145589","https://openalex.org/W4312580880","https://openalex.org/W4313372317","https://openalex.org/W4313374006","https://openalex.org/W4313384369","https://openalex.org/W4319870545","https://openalex.org/W4360980513","https://openalex.org/W4380874680","https://openalex.org/W4385416665","https://openalex.org/W4386124159","https://openalex.org/W4388102819","https://openalex.org/W4388580994","https://openalex.org/W4388581111","https://openalex.org/W4390100804","https://openalex.org/W4390490761","https://openalex.org/W4391136507","https://openalex.org/W4391215636","https://openalex.org/W4392746141","https://openalex.org/W4394998727","https://openalex.org/W4395020691","https://openalex.org/W4396686649","https://openalex.org/W4396814805","https://openalex.org/W4396949324","https://openalex.org/W4398774928","https://openalex.org/W4399074329","https://openalex.org/W4399438280","https://openalex.org/W4400154247","https://openalex.org/W4400680326","https://openalex.org/W4400681470","https://openalex.org/W4401211711","https://openalex.org/W4401881165","https://openalex.org/W4403211091","https://openalex.org/W4403564357","https://openalex.org/W4403983018","https://openalex.org/W4404847991","https://openalex.org/W4406157308","https://openalex.org/W4406157579","https://openalex.org/W4407881031","https://openalex.org/W4408564916","https://openalex.org/W4408903522","https://openalex.org/W4409248836","https://openalex.org/W4410049458","https://openalex.org/W4413458368","https://openalex.org/W4414796894"],"related_works":[],"abstract_inverted_index":{"While":[0],"historically":[1],"used":[2],"for":[3,16,27],"graphics":[4],"applications,":[5],"Graphics":[6],"Processing":[7],"Units":[8],"(GPUs)":[9],"have":[10],"become":[11],"the":[12,25,32,50,55],"most":[13],"prominent":[14],"hardware":[15],"accelerating":[17],"parallel":[18],"workloads,":[19],"including":[20],"HPC":[21,37],"and":[22,38,57,64,69],"AI/ML.":[23],"As":[24],"demand":[26],"GPUs":[28],"skyrockets,":[29],"AMD":[30,51],"released":[31],"CDNA3":[33,52],"architecture":[34],"to":[35],"accelerate":[36],"generative":[39],"AI.":[40],"This":[41],"paper":[42],"serves":[43],"as":[44],"a":[45],"comprehensive":[46],"third-party":[47],"evaluation":[48],"of":[49],"GPU,":[53],"specifically":[54],"MI300X":[56],"MI325X,":[58],"by":[59],"characterizing":[60],"their":[61],"performance,":[62],"power,":[63],"energy":[65],"efficiency":[66],"using":[67],"microbenchmark":[68],"real-world":[70],"applications.":[71]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-11-12T00:00:00"}
