{"id":"https://openalex.org/W2235375535","doi":"https://doi.org/10.1145/2830772.2830811","title":"Safe limits on voltage reduction efficiency in GPUs","display_name":"Safe limits on voltage reduction efficiency in GPUs","publication_year":2015,"publication_date":"2015-12-05","ids":{"openalex":"https://openalex.org/W2235375535","doi":"https://doi.org/10.1145/2830772.2830811","mag":"2235375535"},"language":"en","primary_location":{"id":"doi:10.1145/2830772.2830811","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2830772.2830811","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2830772.2830811","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International Symposium on Microarchitecture","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/2830772.2830811","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003939279","display_name":"Jingwen Leng","orcid":"https://orcid.org/0000-0002-5660-5493"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jingwen Leng","raw_affiliation_strings":["The University of Texas at Austin and IBM T.J. Watson Research Center"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin and IBM T.J. Watson Research Center","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044824009","display_name":"Alper Buyuktosunoglu","orcid":"https://orcid.org/0000-0002-5341-8916"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alper Buyuktosunoglu","raw_affiliation_strings":["IBM T.J. Watson Research Center"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM T.J. Watson Research Center","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017228661","display_name":"Ramon Bertran","orcid":"https://orcid.org/0000-0001-8297-1844"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramon Bertran","raw_affiliation_strings":["IBM T.J. Watson Research Center"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM T.J. Watson Research Center","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009866527","display_name":"Pradip Bose","orcid":"https://orcid.org/0000-0002-1380-5671"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pradip Bose","raw_affiliation_strings":["IBM T.J. Watson Research Center"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM T.J. Watson Research Center","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000635267","display_name":"Vijay Janapa Reddi","orcid":"https://orcid.org/0000-0002-5259-7721"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vijay Janapa Reddi","raw_affiliation_strings":["The University of Texas at Austin"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":8.5653,"has_fulltext":true,"cited_by_count":76,"citation_normalized_percentile":{"value":0.98151986,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"294","last_page":"307"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10363","display_name":"Low-power high-performance VLSI design","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7728078961372375},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.6865313649177551},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6291568875312805},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.5554121732711792},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5054497718811035},{"id":"https://openalex.org/keywords/limit","display_name":"Limit (mathematics)","score":0.46934258937835693},{"id":"https://openalex.org/keywords/microprocessor","display_name":"Microprocessor","score":0.46626147627830505},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.45255813002586365},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4453135132789612},{"id":"https://openalex.org/keywords/voltage-reduction","display_name":"Voltage reduction","score":0.44092857837677},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.42901045083999634},{"id":"https://openalex.org/keywords/microarchitecture","display_name":"Microarchitecture","score":0.41270673274993896},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3841736614704132},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1270047426223755},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.09768983721733093}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7728078961372375},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.6865313649177551},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6291568875312805},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.5554121732711792},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5054497718811035},{"id":"https://openalex.org/C151201525","wikidata":"https://www.wikidata.org/wiki/Q177239","display_name":"Limit (mathematics)","level":2,"score":0.46934258937835693},{"id":"https://openalex.org/C2780728072","wikidata":"https://www.wikidata.org/wiki/Q5297","display_name":"Microprocessor","level":2,"score":0.46626147627830505},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.45255813002586365},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4453135132789612},{"id":"https://openalex.org/C2780745134","wikidata":"https://www.wikidata.org/wiki/Q7940751","display_name":"Voltage reduction","level":3,"score":0.44092857837677},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.42901045083999634},{"id":"https://openalex.org/C107598950","wikidata":"https://www.wikidata.org/wiki/Q259864","display_name":"Microarchitecture","level":2,"score":0.41270673274993896},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3841736614704132},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1270047426223755},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.09768983721733093},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2830772.2830811","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2830772.2830811","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2830772.2830811","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International Symposium on Microarchitecture","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/2830772.2830811","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2830772.2830811","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2830772.2830811","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International Symposium on Microarchitecture","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.8999999761581421,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G1945030456","display_name":null,"funder_award_id":"HR0011-13-C-0022","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G3621590539","display_name":null,"funder_award_id":"HR0011-13-C-0022","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5268805254","display_name":null,"funder_award_id":"CCF-1218474","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5805915551","display_name":"SHF: Small: Cross-Layer Solutions for Sustainable and Reliable Computing Systems","funder_award_id":"1218474","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306078","display_name":"U.S. Department of Defense","ror":"https://ror.org/0447fe631"},{"id":"https://openalex.org/F4320306087","display_name":"Semiconductor Research Corporation","ror":"https://ror.org/047z4n946"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320332815","display_name":"Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2235375535.pdf","grobid_xml":"https://content.openalex.org/works/W2235375535.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W1621319046","https://openalex.org/W1977476862","https://openalex.org/W1981384041","https://openalex.org/W1982700323","https://openalex.org/W1985918920","https://openalex.org/W1989061323","https://openalex.org/W1994172067","https://openalex.org/W1994805710","https://openalex.org/W1997162567","https://openalex.org/W2003128690","https://openalex.org/W2017099699","https://openalex.org/W2023304380","https://openalex.org/W2049303720","https://openalex.org/W2079706534","https://openalex.org/W2080592089","https://openalex.org/W2093043622","https://openalex.org/W2096486545","https://openalex.org/W2098163907","https://openalex.org/W2104677471","https://openalex.org/W2105560148","https://openalex.org/W2117608378","https://openalex.org/W2120405872","https://openalex.org/W2124256021","https://openalex.org/W2129904319","https://openalex.org/W2130720335","https://openalex.org/W2136944230","https://openalex.org/W2146731180","https://openalex.org/W2147042877","https://openalex.org/W2148952606","https://openalex.org/W2156331292","https://openalex.org/W2156665896","https://openalex.org/W2167244863","https://openalex.org/W3018239767","https://openalex.org/W3143229551","https://openalex.org/W3149376625"],"related_works":["https://openalex.org/W1667647204","https://openalex.org/W2404647514","https://openalex.org/W4247536566","https://openalex.org/W4241418540","https://openalex.org/W2018477250","https://openalex.org/W3119814709","https://openalex.org/W1508895727","https://openalex.org/W2725786787","https://openalex.org/W1590965489","https://openalex.org/W2348548806"],"abstract_inverted_index":{"Energy":[0],"efficiency":[1],"of":[2,11,23,77,184],"GPU":[3,26,45,80],"architectures":[4],"has":[5,122],"emerged":[6],"as":[7],"an":[8],"important":[9],"aspect":[10],"computer":[12],"system":[13],"design.":[14],"In":[15],"this":[16],"paper,":[17],"we":[18,149],"explore":[19],"the":[20,25,30,78,88,103,111,119,130,136,139,198,202],"energy":[21,73],"benefits":[22],"reducing":[24],"chip's":[27],"voltage":[28,54,120,144,199],"to":[29,71,129,152,159],"safe":[31],"limit,":[32],"i.e.":[33],"Vmin":[34,100,113,127,162,178],"point.":[35],"We":[36,47,106,115],"perform":[37],"such":[38],"a":[39,97,123,154,185,208],"study":[40],"on":[41,56,75,87,126],"several":[42],"commercial":[43],"off-the-shelf":[44],"cards.":[46,81],"find":[48],"that":[49,118],"there":[50],"exists":[51],"about":[52,110],"20%":[53],"guardband":[55],"those":[57],"GPUs":[58],"spanning":[59],"two":[60],"architectural":[61],"generations,":[62],"which,":[63],"if":[64],"\"eliminated\"":[65],"completely,":[66],"can":[67],"result":[68],"in":[69,192],"up":[70,181],"25%":[72],"savings":[74],"one":[76],"studied":[79,104],"The":[82,165,176],"exact":[83],"improvement":[84],"magnitude":[85],"depends":[86],"program's":[89],"available":[90],"guardband,":[91,200],"because":[92],"our":[93],"measurement":[94],"results":[95],"unveil":[96],"program":[98],"dependent":[99],"behavior":[101],"across":[102],"programs.":[105],"make":[107],"fundamental":[108],"observations":[109],"program-dependent":[112],"behavior.":[114],"experimentally":[116],"determine":[117],"noise":[121],"larger":[124],"impact":[125],"compared":[128],"process":[131],"and":[132,135,167,173,196],"temperature":[133],"variation,":[134],"activities":[137],"during":[138],"kernel":[140],"execution":[141],"cause":[142],"large":[143],"droops.":[145],"From":[146],"these":[147],"findings,":[148],"show":[150],"how":[151],"use":[153],"kernel's":[155],"microarchitectural":[156],"performance":[157],"counters":[158],"predict":[160],"its":[161],"value":[163],"accurately.":[164],"average":[166],"maximum":[168],"prediction":[169,179],"errors":[170],"are":[171],"0.5%":[172],"3%,":[174],"respectively.":[175],"accurate":[177],"opens":[180],"new":[182],"possibilities":[183],"cross-layer":[186],"dynamic":[187],"guardbanding":[188],"scheme":[189],"for":[190],"GPUs,":[191],"which":[193],"software":[194],"predicts":[195],"manages":[197],"while":[201],"functional":[203],"correctness":[204],"is":[205],"ensured":[206],"by":[207],"hardware":[209],"safety":[210],"net":[211],"mechanism.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":14},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":14},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
