{"id":"https://openalex.org/W2059301531","doi":"https://doi.org/10.1109/hpca.2013.6522337","title":"Warped register file: A power efficient register file for GPGPUs","display_name":"Warped register file: A power efficient register file for GPGPUs","publication_year":2013,"publication_date":"2013-02-01","ids":{"openalex":"https://openalex.org/W2059301531","doi":"https://doi.org/10.1109/hpca.2013.6522337","mag":"2059301531"},"language":"en","primary_location":{"id":"doi:10.1109/hpca.2013.6522337","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca.2013.6522337","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 19th International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051502689","display_name":"Mohammad Abdel-Majeed","orcid":"https://orcid.org/0000-0002-0789-4479"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"M. Abdel-Majeed","raw_affiliation_strings":["Electrical Engineering Department, University of Southern California, Los Angeles, CA, USA","Electr. Eng. Dept., Univ. of Southern California, Los Angeles, CA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]},{"raw_affiliation_string":"Electr. Eng. Dept., Univ. of Southern California, Los Angeles, CA, USA#TAB#","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018033573","display_name":"Murali Annavaram","orcid":"https://orcid.org/0000-0002-4633-6867"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M. Annavaram","raw_affiliation_strings":["Electrical Engineering Department, University of Southern California, Los Angeles, CA, USA","Electr. Eng. Dept., Univ. of Southern California, Los Angeles, CA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]},{"raw_affiliation_string":"Electr. Eng. Dept., Univ. of Southern California, Los Angeles, CA, USA#TAB#","institution_ids":["https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5051502689"],"corresponding_institution_ids":["https://openalex.org/I1174212"],"apc_list":null,"apc_paid":null,"fwci":18.5975,"has_fulltext":false,"cited_by_count":116,"citation_normalized_percentile":{"value":0.99571467,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"412","last_page":"423"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/register-file","display_name":"Register file","score":0.9773313403129578},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8713579773902893},{"id":"https://openalex.org/keywords/processor-register","display_name":"Processor register","score":0.7028543949127197},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6319035887718201},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.5006015300750732},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.47596949338912964},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.4259498715400696},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.3191062808036804},{"id":"https://openalex.org/keywords/memory-address","display_name":"Memory address","score":0.08987128734588623}],"concepts":[{"id":"https://openalex.org/C117280010","wikidata":"https://www.wikidata.org/wiki/Q180944","display_name":"Register file","level":3,"score":0.9773313403129578},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8713579773902893},{"id":"https://openalex.org/C2871975","wikidata":"https://www.wikidata.org/wiki/Q187466","display_name":"Processor register","level":4,"score":0.7028543949127197},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6319035887718201},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.5006015300750732},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.47596949338912964},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.4259498715400696},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.3191062808036804},{"id":"https://openalex.org/C153247305","wikidata":"https://www.wikidata.org/wiki/Q835713","display_name":"Memory address","level":3,"score":0.08987128734588623},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca.2013.6522337","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca.2013.6522337","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 19th International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8999999761581421,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W347657323","https://openalex.org/W1979527452","https://openalex.org/W1980364632","https://openalex.org/W2009511314","https://openalex.org/W2024001079","https://openalex.org/W2045110768","https://openalex.org/W2057404685","https://openalex.org/W2062603907","https://openalex.org/W2065770937","https://openalex.org/W2089363288","https://openalex.org/W2090584832","https://openalex.org/W2091559310","https://openalex.org/W2096661534","https://openalex.org/W2097085895","https://openalex.org/W2112569346","https://openalex.org/W2116588741","https://openalex.org/W2119220373","https://openalex.org/W2125647168","https://openalex.org/W2131054871","https://openalex.org/W2138777150","https://openalex.org/W2139433465","https://openalex.org/W2143668295","https://openalex.org/W2157275977","https://openalex.org/W4241620505","https://openalex.org/W4245021564","https://openalex.org/W4246117596","https://openalex.org/W4248310916","https://openalex.org/W6677494409","https://openalex.org/W6681126484"],"related_works":["https://openalex.org/W2224192221","https://openalex.org/W1482836228","https://openalex.org/W2356166161","https://openalex.org/W2014882201","https://openalex.org/W3144620029","https://openalex.org/W2009783759","https://openalex.org/W2103008217","https://openalex.org/W1521414776","https://openalex.org/W4245282684","https://openalex.org/W74994880"],"abstract_inverted_index":{"General":[0],"purpose":[1],"graphics":[2],"processing":[3],"units":[4],"(GPGPUs)":[5],"have":[6,221],"the":[7,33,41,46,53,63,99,107,124,236,241,247,251],"ability":[8],"to":[9,31,86,97,122,151,214],"execute":[10],"hundreds":[11],"of":[12,35,45,71,112,203,250],"concurrent":[13],"threads.":[14,224],"To":[15,182],"support":[16],"massive":[17],"parallelism":[18,216],"GPGPUs":[19,84],"provide":[20],"a":[21,29,59,72,116,152,162,211],"very":[22],"large":[23,88],"register":[24,54,73,89,101,118,153,163,252],"file,":[25],"even":[26],"larger":[27],"than":[28],"cache,":[30],"hold":[32],"state":[34,142,166],"each":[36,145,169],"thread.":[37],"As":[38,62],"technology":[39],"scales,":[40],"leakage":[42,125,176],"power":[43,57,69,103,177,185,248],"consumption":[44,58,70,249],"SRAM":[47],"cells":[48],"is":[49,75,154],"getting":[50],"worse":[51],"making":[52],"file":[55,74,90,102,253],"static":[56],"major":[60],"concern.":[61],"supply":[64],"voltage":[65],"scaling":[66],"slows,":[67],"dynamic":[68,184],"not":[76],"reducing.":[77],"These":[78],"concerns":[79],"are":[80],"particularly":[81],"acute":[82],"in":[83,157,172,175],"due":[85],"their":[87],"size.":[91],"This":[92,127],"paper":[93,187],"presents":[94],"two":[95,242],"techniques":[96,243],"reduce":[98,123,183],"GPGPU":[100],"consumption.":[104],"By":[105,239],"exploiting":[106],"unique":[108],"software":[109],"execution":[110],"model":[111],"GPGPUs,":[113],"we":[114,244],"propose":[115],"tri-modal":[117],"access":[119,170],"control":[120],"unit":[121,128,195],"power.":[126],"first":[129],"turns":[130],"off":[131],"any":[132],"unallocated":[133],"register,":[134],"and":[135,201,217],"places":[136],"all":[137,207],"allocated":[138],"registers":[139,204,226],"into":[140,164],"drowsy":[141,165],"immediately":[143,167],"after":[144,168],"access.":[146],"The":[147],"average":[148],"inter-access":[149],"distance":[150],"789":[155],"cycles":[156],"GPGPUs.":[158],"Hence,":[159,225],"aggressively":[160],"moving":[161],"results":[171],"90%":[173],"reduction":[174],"with":[178,206,228],"negligible":[179],"performance":[180],"impact.":[181],"this":[186],"proposes":[188],"an":[189],"active":[190,237],"mask":[191],"aware":[192],"activity":[193],"gating":[194],"that":[196,246],"avoids":[197],"charging":[198],"bit":[199],"lines":[200],"wordlines":[202],"associated":[205,227],"inactive":[208,223,229],"threads":[209,230],"within":[210],"warp.":[212],"Due":[213],"insufficient":[215],"branch":[218],"divergence":[219],"warps":[220],"many":[222],"can":[231,254],"be":[232,255],"identified":[233],"precisely":[234],"using":[235],"mask.":[238],"combining":[240],"show":[245],"reduced":[256],"by":[257],"69%":[258],"on":[259],"average.":[260]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":10},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":11},{"year":2017,"cited_by_count":16},{"year":2016,"cited_by_count":24},{"year":2015,"cited_by_count":19},{"year":2014,"cited_by_count":12},{"year":2013,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
