{"id":"https://openalex.org/W2322230929","doi":"https://doi.org/10.1109/hpca.2016.7446063","title":"Approximating warps with intra-warp operand value similarity","display_name":"Approximating warps with intra-warp operand value similarity","publication_year":2016,"publication_date":"2016-03-01","ids":{"openalex":"https://openalex.org/W2322230929","doi":"https://doi.org/10.1109/hpca.2016.7446063","mag":"2322230929"},"language":"en","primary_location":{"id":"doi:10.1109/hpca.2016.7446063","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca.2016.7446063","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000712719","display_name":"Daniel Wong","orcid":"https://orcid.org/0000-0002-5376-7868"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Daniel Wong","raw_affiliation_strings":["University of California, Riverside"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Riverside","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037648751","display_name":"Nam Sung Kim","orcid":"https://orcid.org/0000-0002-0442-5634"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nam Sung Kim","raw_affiliation_strings":["University of Illinois, Urbana-Champaign"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Illinois, Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018033573","display_name":"Murali Annavaram","orcid":"https://orcid.org/0000-0002-4633-6867"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I2800817003","display_name":"California Southern University","ror":"https://ror.org/058zz0t50","country_code":"US","type":"education","lineage":["https://openalex.org/I2800817003"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Murali Annavaram","raw_affiliation_strings":["University of Southern California"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Southern California","institution_ids":["https://openalex.org/I2800817003","https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":7.05,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.97406733,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"176","last_page":"187"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/operand","display_name":"Operand","score":0.8922989368438721},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7168868780136108},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7151458263397217},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.5895386934280396},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.5554065108299255},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.5059134364128113},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4686300754547119},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.43976426124572754},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1288549304008484},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.11310872435569763}],"concepts":[{"id":"https://openalex.org/C55526617","wikidata":"https://www.wikidata.org/wiki/Q719375","display_name":"Operand","level":2,"score":0.8922989368438721},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7168868780136108},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7151458263397217},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.5895386934280396},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.5554065108299255},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.5059134364128113},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4686300754547119},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.43976426124572754},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1288549304008484},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.11310872435569763},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca.2016.7446063","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca.2016.7446063","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.9100000262260437,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W1492552760","https://openalex.org/W1979527452","https://openalex.org/W1991518265","https://openalex.org/W1996037679","https://openalex.org/W2005506050","https://openalex.org/W2020517863","https://openalex.org/W2026186397","https://openalex.org/W2026764611","https://openalex.org/W2037898879","https://openalex.org/W2038178246","https://openalex.org/W2057434193","https://openalex.org/W2080592089","https://openalex.org/W2089854225","https://openalex.org/W2090584832","https://openalex.org/W2093043622","https://openalex.org/W2095667776","https://openalex.org/W2095872092","https://openalex.org/W2097243222","https://openalex.org/W2097652499","https://openalex.org/W2114703523","https://openalex.org/W2118826546","https://openalex.org/W2119299853","https://openalex.org/W2125452276","https://openalex.org/W2130681828","https://openalex.org/W2138761132","https://openalex.org/W2142883190","https://openalex.org/W2143283746","https://openalex.org/W2146065717","https://openalex.org/W2149234156","https://openalex.org/W2154693467","https://openalex.org/W2161910890","https://openalex.org/W2166250385","https://openalex.org/W2166773037","https://openalex.org/W2167258273","https://openalex.org/W2168429197","https://openalex.org/W2170382128","https://openalex.org/W2170881177","https://openalex.org/W2187230075","https://openalex.org/W3004111065","https://openalex.org/W4205391132","https://openalex.org/W4205579859","https://openalex.org/W4240237526","https://openalex.org/W4244884309","https://openalex.org/W4248185003","https://openalex.org/W4250075075","https://openalex.org/W4251054771","https://openalex.org/W4253048710","https://openalex.org/W4253750843","https://openalex.org/W4254893742","https://openalex.org/W6678014459","https://openalex.org/W7006594605"],"related_works":["https://openalex.org/W2556282987","https://openalex.org/W1533508804","https://openalex.org/W2050923821","https://openalex.org/W1970370079","https://openalex.org/W2333680585","https://openalex.org/W2098637578","https://openalex.org/W1999746819","https://openalex.org/W1996625680","https://openalex.org/W4378651692","https://openalex.org/W4236954329"],"abstract_inverted_index":{"Value":[0,19],"locality,":[1],"the":[2,10,22,33,43,49,60,117,141,150],"recurrence":[3],"of":[4,12,24,45,62,68,115],"a":[5,66,109,121,125,145],"previously-seen":[6],"value,":[7],"has":[8],"been":[9],"enabler":[11],"myriad":[13],"optimization":[14],"techniques":[15],"in":[16,32,59,79,105,120,140],"traditional":[17],"processors.":[18],"similarity":[20,58,70,90,104],"relaxes":[21],"constraint":[23],"value":[25,57,69,74,89,103,127,130,134,146],"locality":[26],"by":[27,169,174,182],"allowing":[28],"values":[29,38],"to":[30,91],"differ":[31],"lowest":[34],"significant":[35],"bits":[36],"where":[37],"are":[39],"micro-architecturally":[40],"near.":[41],"With":[42,160],"end":[44],"Dennard":[46],"Scaling":[47],"and":[48,107,152,176],"turn":[50],"towards":[51],"massively":[52],"parallel":[53],"accelerators,":[54],"we":[55,163],"revisit":[56],"context":[61],"GPUs.":[63,80],"We":[64,81],"identify":[65],"form":[67],"called":[71],"intra-warp":[72,87,101],"operand":[73,88,102],"similarity,":[75],"which":[76,85],"is":[77],"abundant":[78],"present":[82],"Warp":[83,97,161],"Approximation,":[84,162],"leverages":[86],"trade":[92],"off":[93],"accuracy":[94],"for":[95],"energy.":[96],"Approximation":[98],"dynamically":[99],"identifies":[100],"hardware,":[106],"executes":[108],"single":[110],"representative":[111,126,133],"thread":[112],"on":[113],"behalf":[114],"all":[116],"active":[118],"threads":[119],"warp,":[122],"thereby":[123],"producing":[124],"with":[128,157,184],"approximate":[129,158],"locality.":[131],"This":[132],"can":[135,164],"then":[136],"be":[137],"stored":[138],"compactly":[139],"register":[142,171],"file":[143,172],"as":[144],"similar":[147],"scalar,":[148],"reducing":[149],"read":[151],"write":[153],"energy":[154,168,173,180],"when":[155],"dealing":[156],"data.":[159],"reduce":[165],"execution":[166],"unit":[167],"37%,":[170],"28%,":[175],"improve":[177],"overall":[178],"GPGPU":[179],"efficiency":[181],"26%":[183],"minimal":[185],"quality":[186],"degradation.":[187]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":8},{"year":2016,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
