{"id":"https://openalex.org/W7125385736","doi":"https://doi.org/10.1145/3784828.3785157","title":"System-Level Energy Profiling of Wafer-Scale AI Systems: Characterizing Non-Accelerator Overheads in the Cerebras CS-2 System","display_name":"System-Level Energy Profiling of Wafer-Scale AI Systems: Characterizing Non-Accelerator Overheads in the Cerebras CS-2 System","publication_year":2026,"publication_date":"2026-01-22","ids":{"openalex":"https://openalex.org/W7125385736","doi":"https://doi.org/10.1145/3784828.3785157"},"language":null,"primary_location":{"id":"doi:10.1145/3784828.3785157","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3784828.3785157","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Supercomputing Asia and International Conference on High Performance Computing in Asia Pacific Region Workshops","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3784828.3785157","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085442143","display_name":"Jophin John","orcid":null},"institutions":[{"id":"https://openalex.org/I4210163716","display_name":"Leibniz Supercomputing Centre","ror":"https://ror.org/05558nw16","country_code":"DE","type":"facility","lineage":["https://openalex.org/I109144446","https://openalex.org/I4210163716"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Jophin John","raw_affiliation_strings":["Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany","institution_ids":["https://openalex.org/I4210163716"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064628804","display_name":"Hoi Wah Mak","orcid":null},"institutions":[{"id":"https://openalex.org/I4210163716","display_name":"Leibniz Supercomputing Centre","ror":"https://ror.org/05558nw16","country_code":"DE","type":"facility","lineage":["https://openalex.org/I109144446","https://openalex.org/I4210163716"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Hoi-Fong Mak","raw_affiliation_strings":["Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany","institution_ids":["https://openalex.org/I4210163716"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123610874","display_name":"Michael Hoffmann","orcid":null},"institutions":[{"id":"https://openalex.org/I4210163716","display_name":"Leibniz Supercomputing Centre","ror":"https://ror.org/05558nw16","country_code":"DE","type":"facility","lineage":["https://openalex.org/I109144446","https://openalex.org/I4210163716"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Michael Hoffmann","raw_affiliation_strings":["Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany","institution_ids":["https://openalex.org/I4210163716"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123542550","display_name":"Alice Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140540","display_name":"Singularity University","ror":"https://ror.org/04rv9a088","country_code":"US","type":"education","lineage":["https://openalex.org/I4210140540"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alice Zhang","raw_affiliation_strings":["Cerebras Systems, Sunnyvale, USA"],"affiliations":[{"raw_affiliation_string":"Cerebras Systems, Sunnyvale, USA","institution_ids":["https://openalex.org/I4210140540"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082396646","display_name":"Tapasya Patki","orcid":"https://orcid.org/0000-0003-2543-9688"},"institutions":[{"id":"https://openalex.org/I1282311441","display_name":"Lawrence Livermore National Laboratory","ror":"https://ror.org/041nk4h53","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282311441","https://openalex.org/I1330989302","https://openalex.org/I198811213","https://openalex.org/I4210138311"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tapasya Patki","raw_affiliation_strings":["Lawrence Livermore National Laboratory, Livermore, USA"],"affiliations":[{"raw_affiliation_string":"Lawrence Livermore National Laboratory, Livermore, USA","institution_ids":["https://openalex.org/I1282311441"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048904411","display_name":"Nicolay Hammer","orcid":"https://orcid.org/0000-0001-6258-8813"},"institutions":[{"id":"https://openalex.org/I4210163716","display_name":"Leibniz Supercomputing Centre","ror":"https://ror.org/05558nw16","country_code":"DE","type":"facility","lineage":["https://openalex.org/I109144446","https://openalex.org/I4210163716"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Nicolay Hammer","raw_affiliation_strings":["Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Leibniz Supercomputing Centre (LRZ), Garching near Munich, Germany","institution_ids":["https://openalex.org/I4210163716"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5085442143"],"corresponding_institution_ids":["https://openalex.org/I4210163716"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37203559,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"31","last_page":"39"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12238","display_name":"Green IT and Sustainability","score":0.2257000058889389,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12238","display_name":"Green IT and Sustainability","score":0.2257000058889389,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.13490000367164612,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.12189999967813492,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.7218000292778015},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.6704000234603882},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.47999998927116394},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.4690999984741211},{"id":"https://openalex.org/keywords/energy-management-system","display_name":"Energy management system","score":0.4438000023365021},{"id":"https://openalex.org/keywords/energy-management","display_name":"Energy management","score":0.4408000111579895},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.4074999988079071}],"concepts":[{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.7218000292778015},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.6704000234603882},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6568999886512756},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.49390000104904175},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.47999998927116394},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.4690999984741211},{"id":"https://openalex.org/C2781260460","wikidata":"https://www.wikidata.org/wiki/Q6139999","display_name":"Energy management system","level":4,"score":0.4438000023365021},{"id":"https://openalex.org/C7817414","wikidata":"https://www.wikidata.org/wiki/Q1779504","display_name":"Energy management","level":3,"score":0.4408000111579895},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.4074999988079071},{"id":"https://openalex.org/C2984118289","wikidata":"https://www.wikidata.org/wiki/Q29954","display_name":"Power consumption","level":3,"score":0.36739999055862427},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.29899999499320984},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.2935999929904938},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.29319998621940613},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2851000130176544},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.28299999237060547},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3784828.3785157","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3784828.3785157","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Supercomputing Asia and International Conference on High Performance Computing in Asia Pacific Region Workshops","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3784828.3785157","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3784828.3785157","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Supercomputing Asia and International Conference on High Performance Computing in Asia Pacific Region Workshops","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.5192975997924805}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2038924755","https://openalex.org/W3021539948","https://openalex.org/W4288086139","https://openalex.org/W4376130831","https://openalex.org/W4406708607","https://openalex.org/W4406895142","https://openalex.org/W4411344667","https://openalex.org/W4413019615","https://openalex.org/W4414498719","https://openalex.org/W4415428766"],"related_works":[],"abstract_inverted_index":{"The":[0,114],"escalating":[1],"energy":[2,38,105,128,149,162],"demands":[3],"of":[4,17,84,104,125,142],"large-scale":[5],"artificial":[6],"intelligence":[7],"(AI)":[8],"training":[9],"highlight":[10,139],"the":[11,34,42,135,140],"need":[12],"for":[13,28,60,121,159],"a":[14,93,100,144],"holistic":[15],"understanding":[16],"power":[18],"consumption":[19,106],"across":[20,107],"complete":[21],"computing":[22],"systems.":[23],"This":[24],"is":[25],"particularly":[26],"important":[27],"emerging":[29],"wafer-scale":[30,152],"architectures":[31],"such":[32,50],"as":[33,51],"Cerebras":[35],"CS-2,":[36],"where":[37],"usage":[39],"extends":[40],"beyond":[41],"Wafer-Scale":[43],"Engine":[44],"(WSE)":[45],"to":[46,92,123,164],"include":[47],"supporting":[48],"infrastructure":[49],"management":[52],"nodes":[53,58,65],"that":[54,66,117],"coordinate":[55],"workflows,":[56],"worker":[57],"responsible":[59],"data":[61],"streaming,":[62],"and":[63,70,111,129,155,167],"MemoryX":[64],"handle":[67],"weight":[68],"updates":[69],"parameter":[71],"transfers.":[72],"Conventional":[73],"GPU-centric":[74],"profiling":[75],"approaches":[76],"overlook":[77],"these":[78],"contributors,":[79],"providing":[80],"an":[81],"incomplete":[82],"view":[83],"total":[85,126],"system":[86,127],"efficiency.":[87],"Leveraging":[88],"administrative":[89],"telemetry":[90],"access":[91],"dedicated":[94],"CS-2":[95],"installation,":[96],"this":[97],"study":[98],"presents":[99],"comprehensive":[101],"end-to-end":[102],"analysis":[103],"all":[108],"major":[109],"subsystems":[110],"computational":[112],"phases.":[113],"results":[115],"show":[116],"non-WSE":[118],"components":[119],"account":[120],"up":[122],"10%":[124],"exhibit":[130],"strong":[131],"temporal":[132],"coupling":[133],"with":[134],"accelerator.":[136],"These":[137],"findings":[138],"necessity":[141],"adopting":[143],"system-level":[145],"perspective":[146],"when":[147],"evaluating":[148],"efficiency":[150],"in":[151],"AI":[153],"systems":[154],"motivate":[156],"developing":[157],"tools":[158],"fine-grained,":[160],"phase-aware":[161],"measurements":[163],"improve":[165],"transparency":[166],"sustainability.":[168]},"counts_by_year":[],"updated_date":"2026-02-23T20:09:44.859080","created_date":"2026-01-23T00:00:00"}
