{"id":"https://openalex.org/W7155360351","doi":"https://doi.org/10.48550/arxiv.2604.20105","title":"EnergAIzer: Fast and Accurate GPU Power Estimation Framework for AI Workloads","display_name":"EnergAIzer: Fast and Accurate GPU Power Estimation Framework for AI Workloads","publication_year":2026,"publication_date":"2026-04-22","ids":{"openalex":"https://openalex.org/W7155360351","doi":"https://doi.org/10.48550/arxiv.2604.20105"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.20105","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20105","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.20105","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134396358","display_name":"Kyungmi Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Kyungmi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050263836","display_name":"Zhiye Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Zhiye","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134428349","display_name":"Eun Kyung Lee","orcid":"https://orcid.org/0000-0001-7334-2050"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Eun Kyung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134449583","display_name":"Xin Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134366457","display_name":"Tamar Eilam","orcid":"https://orcid.org/0009-0002-1992-8899"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eilam, Tamar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134445097","display_name":"Anantha P. Chandrakasan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chandrakasan, Anantha P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.7738999724388123,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.7738999724388123,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.12229999899864197,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.0203000009059906,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.8729000091552734},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7493000030517578},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.6026999950408936},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6013000011444092},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.43790000677108765},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.3921999931335449},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.3783999979496002},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.3515999913215637}],"concepts":[{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.8729000091552734},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8199999928474426},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7493000030517578},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.6026999950408936},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6013000011444092},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.4440000057220459},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.43790000677108765},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.3921999931335449},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.38830000162124634},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3783999979496002},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3573000133037567},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3515999913215637},{"id":"https://openalex.org/C168292644","wikidata":"https://www.wikidata.org/wiki/Q10860336","display_name":"Power optimization","level":4,"score":0.3325999975204468},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.32710000872612},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.322299987077713},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.32170000672340393},{"id":"https://openalex.org/C157742956","wikidata":"https://www.wikidata.org/wiki/Q3237776","display_name":"Frequency scaling","level":3,"score":0.3084999918937683},{"id":"https://openalex.org/C45872418","wikidata":"https://www.wikidata.org/wiki/Q5318966","display_name":"Dynamic demand","level":3,"score":0.3041999936103821},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C118993495","wikidata":"https://www.wikidata.org/wiki/Q5042828","display_name":"Electrical efficiency","level":3,"score":0.2856999933719635},{"id":"https://openalex.org/C2778774385","wikidata":"https://www.wikidata.org/wiki/Q4437810","display_name":"Power management","level":3,"score":0.2847999930381775},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.26100000739097595},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2522999942302704},{"id":"https://openalex.org/C2778100165","wikidata":"https://www.wikidata.org/wiki/Q1589327","display_name":"Memory hierarchy","level":3,"score":0.25209999084472656}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.20105","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20105","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.20105","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20105","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8423354625701904,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"AI":[1,94,201],"workloads":[2,95],"drive":[3],"increases":[4],"in":[5,28,34,93],"datacenter":[6],"power":[7,11,17,21,141,146,151,160,183,198],"consumption,":[8],"accurate":[9,197],"GPU":[10],"estimation":[12,81],"is":[13,90,136],"critical":[14],"for":[15,123,174,200,206],"proactive":[16],"management.":[18],"However,":[19],"existing":[20],"models":[22,161],"face":[23],"a":[24,72,113],"scalability":[25,68],"bottleneck":[26,69],"not":[27],"the":[29,36,80,182,204],"modeling":[30],"techniques":[31],"themselves,":[32],"but":[33],"obtaining":[35],"hardware":[37,50,167],"utilization":[38,77,135],"inputs":[39],"they":[40],"require.":[41],"Conventional":[42],"approaches":[43],"rely":[44],"on":[45,153],"either":[46],"costly":[47],"simulation":[48,165],"or":[49,166],"profiling,":[51],"which":[52,65,103,127],"makes":[53],"them":[54],"impractical":[55],"when":[56],"rapid":[57],"predictions":[58],"are":[59],"required.":[60],"This":[61,133],"work":[62],"presents":[63],"EnergAIzer,":[64],"addresses":[66],"this":[67],"by":[70],"developing":[71],"lightweight":[73],"solution":[74],"to":[75,85,143],"predict":[76],"inputs,":[78],"reducing":[79],"walltime":[82],"from":[83],"hours":[84],"seconds.":[86],"Our":[87],"key":[88],"insight":[89],"that":[91,99],"kernels":[92],"commonly":[96],"employ":[97],"optimizations":[98],"create":[100],"structured":[101],"patterns,":[102],"analytically":[104],"determine":[105],"memory":[106],"traffic":[107],"and":[108,177,196],"execution":[109],"timeline.":[110],"We":[111,169],"construct":[112],"performance":[114],"model":[115,142],"using":[116],"these":[117],"patterns":[118],"as":[119],"an":[120],"analytical":[121],"scaffold":[122],"empirical":[124],"data":[125],"fitting,":[126],"also":[128],"naturally":[129],"exposes":[130],"module-level":[131],"utilization.":[132],"predicted":[134],"then":[137],"fed":[138],"into":[139],"our":[140],"estimate":[144],"dynamic":[145],"consumption.":[147],"EnergAIzer":[148,193],"achieves":[149],"8%":[150],"errors":[152],"NVIDIA":[154,185],"Ampere":[155],"GPUs,":[156],"competitive":[157],"with":[158,162,187],"traditional":[159],"elaborate":[163],"cycle-level":[164],"profiling.":[168],"demonstrate":[170],"EnergAIzer's":[171],"exploration":[172],"capabilities":[173],"frequency":[175],"scaling":[176],"architectural":[178],"configurations,":[179],"including":[180],"forecasting":[181],"of":[184],"H100":[186],"just":[188],"7%":[189],"error.":[190],"In":[191],"summary,":[192],"provides":[194],"fast":[195],"prediction":[199],"workloads,":[202],"paving":[203],"way":[205],"power-aware":[207],"design":[208],"explorations.":[209]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-24T00:00:00"}
