{"id":"https://openalex.org/W2117457971","doi":"https://doi.org/10.1145/2001269.2001291","title":"Understanding sources of ineffciency in general-purpose chips","display_name":"Understanding sources of ineffciency in general-purpose chips","publication_year":2011,"publication_date":"2011-09-23","ids":{"openalex":"https://openalex.org/W2117457971","doi":"https://doi.org/10.1145/2001269.2001291","mag":"2117457971"},"language":"en","primary_location":{"id":"doi:10.1145/2001269.2001291","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2001269.2001291","pdf_url":null,"source":{"id":"https://openalex.org/S103482838","display_name":"Communications of the ACM","issn_l":"0001-0782","issn":["0001-0782","1557-7317"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications of the ACM","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111517327","display_name":"Rehan Hameed","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Rehan Hameed","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056488298","display_name":"Wajahat Qadeer","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wajahat Qadeer","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071780189","display_name":"Megan Wachs","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Megan Wachs","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035434738","display_name":"Omid Azizi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Omid Azizi","raw_affiliation_strings":["Hicamp Systems, Menlo Park, CA"],"affiliations":[{"raw_affiliation_string":"Hicamp Systems, Menlo Park, CA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000964076","display_name":"Alex Solomatnikov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alex Solomatnikov","raw_affiliation_strings":["Hicamp Systems, Menlo Park, CA"],"affiliations":[{"raw_affiliation_string":"Hicamp Systems, Menlo Park, CA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003811456","display_name":"Benjamin C. Lee","orcid":"https://orcid.org/0000-0003-4472-6375"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Benjamin C. Lee","raw_affiliation_strings":["Duke University, Durham, NC"],"affiliations":[{"raw_affiliation_string":"Duke University, Durham, NC","institution_ids":["https://openalex.org/I170897317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059607447","display_name":"Stephen Richardson","orcid":"https://orcid.org/0000-0003-4359-3638"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Stephen Richardson","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042148531","display_name":"Christos Kozyrakis","orcid":"https://orcid.org/0000-0002-3154-7530"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christos Kozyrakis","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090469068","display_name":"Mark Horowitz","orcid":"https://orcid.org/0000-0003-3245-7542"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark Horowitz","raw_affiliation_strings":["Stanford University, Stanford, CA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5111517327"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":4.0298,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.94530877,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"54","issue":"10","first_page":"85","last_page":"93"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11522","display_name":"VLSI and FPGA Design Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/application-specific-integrated-circuit","display_name":"Application-specific integrated circuit","score":0.8263970613479614},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8210399150848389},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.6646353006362915},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.6564090251922607},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.582101583480835},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.4975438416004181},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.4724082350730896},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.46868613362312317},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4232363998889923},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.37361422181129456},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.225886732339859},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.1086118221282959},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07899445295333862}],"concepts":[{"id":"https://openalex.org/C77390884","wikidata":"https://www.wikidata.org/wiki/Q217302","display_name":"Application-specific integrated circuit","level":2,"score":0.8263970613479614},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8210399150848389},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.6646353006362915},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.6564090251922607},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.582101583480835},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.4975438416004181},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.4724082350730896},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.46868613362312317},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4232363998889923},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.37361422181129456},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.225886732339859},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.1086118221282959},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07899445295333862},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2001269.2001291","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2001269.2001291","pdf_url":null,"source":{"id":"https://openalex.org/S103482838","display_name":"Communications of the ACM","issn_l":"0001-0782","issn":["0001-0782","1557-7317"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications of the ACM","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8999999761581421,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G7181103621","display_name":null,"funder_award_id":"937060","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320308633","display_name":"Computing Research Association","ror":"https://ror.org/00agrkd75"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1535772895","https://openalex.org/W1967320979","https://openalex.org/W1982008951","https://openalex.org/W1990832096","https://openalex.org/W2006312753","https://openalex.org/W2014173115","https://openalex.org/W2089244779","https://openalex.org/W2096910408","https://openalex.org/W2111488604","https://openalex.org/W2115547150","https://openalex.org/W2120771707","https://openalex.org/W2128765420","https://openalex.org/W2132729131","https://openalex.org/W2145905710","https://openalex.org/W2153416280","https://openalex.org/W2154051217","https://openalex.org/W2170909854","https://openalex.org/W2623012778","https://openalex.org/W2989908748","https://openalex.org/W4247949726","https://openalex.org/W4249497434","https://openalex.org/W4388624454"],"related_works":["https://openalex.org/W2534771569","https://openalex.org/W2037547261","https://openalex.org/W4311812695","https://openalex.org/W2117788426","https://openalex.org/W4242015792","https://openalex.org/W3011583392","https://openalex.org/W2291920536","https://openalex.org/W2164535554","https://openalex.org/W2133317661","https://openalex.org/W2136725475"],"abstract_inverted_index":{"Scaling":[0],"the":[1,10,42,45,68,84,96,137,160,203,208],"performance":[2,46,117,167,210],"of":[3,44,50,159,176,186,189,200,214],"a":[4,51,58,99,149,180],"power":[5],"limited":[6],"processor":[7,28],"requires":[8,170],"decreasing":[9],"energy":[11,48,74,122,161,195,218],"expended":[12],"per":[13,156,191],"instruction":[14],"executed,":[15],"since":[16],"energy/op":[17],"*":[18],"op/second":[19],"is":[20,30,126,135,162],"power.":[21],"To":[22],"better":[23],"understand":[24],"what":[25,33],"improvement":[26],"in":[27,141,219],"efficiency":[29],"possible,":[31],"and":[32,47,121,168,202,211],"must":[34],"be":[35],"done":[36],"to":[37,90],"capture":[38],"it,":[39],"we":[40,178],"quantify":[41],"sources":[43],"overheads":[49,65,93],"720p":[52],"HD":[53],"H.264":[54,103,142],"encoder":[55],"running":[56],"on":[57],"general-purpose":[59],"four-processor":[60],"CMP":[61,69,116,206],"system.":[62],"The":[63,133],"initial":[64],"are":[66,143],"large:":[67],"was":[70],"500":[71],"x":[72,120],"less":[73],"efficient":[75],"than":[76,130],"an":[77,131,215],"Application":[78],"Specific":[79],"Integrated":[80],"Circuit":[81],"(ASIC)":[82],"doing":[83,152],"same":[85,209],"job.":[86],"We":[87],"explore":[88],"methods":[89],"eliminate":[91],"these":[92],"by":[94,118,123,197],"transforming":[95],"CPU":[97],"into":[98],"specialized":[100,182],"system":[101],"for":[102],"encoding.":[104],"Broadly":[105],"applicable":[106],"optimizations":[107],"like":[108],"single":[109],"instruction,":[110],"multiple":[111],"data":[112],"(SIMD)":[113],"units":[114],"improve":[115],"14":[119],"10x,":[124],"which":[125],"still":[127,163],"50x":[128],"worse":[129],"ASIC.":[132],"problem":[134],"that":[136,146],"basic":[138],"operation":[139],"costs":[140],"so":[144],"small":[145],"even":[147],"with":[148],"SIMD":[150],"unit":[151,184],"over":[153],"10":[154],"ops":[155],"cycle,":[157],"90%":[158],"overhead.":[164],"Achieving":[165],"ASIC-like":[166],"effciency":[169,196],"algorithm-specifc":[171],"optimizations.":[172],"For":[173],"each":[174],"subalgorithm":[175],"H.264,":[177],"create":[179],"large,":[181],"functional/storage":[183],"capable":[185],"executing":[187],"hundreds":[188],"operations":[190],"instruction.":[192],"This":[193],"improves":[194],"160x":[198],"(instead":[199],"10x),":[201],"final":[204],"customized":[205],"reaches":[207],"within":[212],"3x":[213],"ASIC":[216],"solution's":[217],"comparable":[220],"area.":[221]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":9},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
