{"id":"https://openalex.org/W3137551601","doi":"https://doi.org/10.1109/pact.2013.6618806","title":"Neither more nor less: optimizing thread-level parallelism for GPGPUs","display_name":"Neither more nor less: optimizing thread-level parallelism for GPGPUs","publication_year":2013,"publication_date":"2013-10-01","ids":{"openalex":"https://openalex.org/W3137551601","doi":"https://doi.org/10.1109/pact.2013.6618806","mag":"3137551601"},"language":"en","primary_location":{"id":"doi:10.1109/pact.2013.6618806","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2013.6618806","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd International Conference on Parallel Architectures and Compilation Techniques","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/2117/21383","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032189355","display_name":"Jos\u00e9-Mar\u00eda Arnau","orcid":null},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Jose-Maria Arnau","raw_affiliation_strings":["Computer Architecture Department, Universitat Politecnica de Catalunya, Spain"],"affiliations":[{"raw_affiliation_string":"Computer Architecture Department, Universitat Politecnica de Catalunya, Spain","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054367087","display_name":"Joan-Manuel Parcerisa","orcid":"https://orcid.org/0000-0001-5771-8118"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Joan-Manuel Parcerisa","raw_affiliation_strings":["Computer Architecture Department, Universitat Politecnica de Catalunya, Spain"],"affiliations":[{"raw_affiliation_string":"Computer Architecture Department, Universitat Politecnica de Catalunya, Spain","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048196769","display_name":"Polychronis Xekalakis","orcid":null},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Polychronis Xekalakis","raw_affiliation_strings":["Intel Laboratories, Intel Corporation, USA"],"affiliations":[{"raw_affiliation_string":"Intel Laboratories, Intel Corporation, USA","institution_ids":["https://openalex.org/I1343180700"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5032189355"],"corresponding_institution_ids":["https://openalex.org/I9617848"],"apc_list":null,"apc_paid":null,"fwci":11.0324,"has_fulltext":false,"cited_by_count":89,"citation_normalized_percentile":{"value":0.98651906,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"157","last_page":"166"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8868339657783508},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.669097363948822},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6521193981170654},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5787402391433716},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.5631975531578064},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.5290870666503906},{"id":"https://openalex.org/keywords/locality-of-reference","display_name":"Locality of reference","score":0.5087469220161438},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.49222293496131897},{"id":"https://openalex.org/keywords/frame-rate","display_name":"Frame rate","score":0.482204794883728},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.43889275193214417},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4124370217323303},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.38138651847839355},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.35585665702819824},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3425498604774475},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.26411008834838867},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.2548145055770874},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.22262966632843018},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.11665794253349304},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.10461157560348511}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8868339657783508},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.669097363948822},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6521193981170654},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5787402391433716},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.5631975531578064},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.5290870666503906},{"id":"https://openalex.org/C27602214","wikidata":"https://www.wikidata.org/wiki/Q1868547","display_name":"Locality of reference","level":3,"score":0.5087469220161438},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.49222293496131897},{"id":"https://openalex.org/C3261483","wikidata":"https://www.wikidata.org/wiki/Q119565","display_name":"Frame rate","level":2,"score":0.482204794883728},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.43889275193214417},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4124370217323303},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.38138651847839355},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.35585665702819824},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3425498604774475},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.26411008834838867},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.2548145055770874},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.22262966632843018},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.11665794253349304},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.10461157560348511},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/pact.2013.6618806","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact.2013.6618806","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd International Conference on Parallel Architectures and Compilation Techniques","raw_type":"proceedings-article"},{"id":"pmh:oai:upcommons.upc.edu:2117/21383","is_oa":true,"landing_page_url":"http://hdl.handle.net/2117/21383","pdf_url":null,"source":{"id":"https://openalex.org/S4377196262","display_name":"UPCommons institutional repository (Universitat Polit\u00e8cnica de Catalunya)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9617848","host_organization_name":"Universitat Polit\u00e8cnica de Catalunya","host_organization_lineage":["https://openalex.org/I9617848"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:upcommons.upc.edu:2117/21383","is_oa":true,"landing_page_url":"http://hdl.handle.net/2117/21383","pdf_url":null,"source":{"id":"https://openalex.org/S4377196262","display_name":"UPCommons institutional repository (Universitat Polit\u00e8cnica de Catalunya)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9617848","host_organization_name":"Universitat Polit\u00e8cnica de Catalunya","host_organization_lineage":["https://openalex.org/I9617848"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"},"sustainable_development_goals":[{"score":0.9100000262260437,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1516629665","https://openalex.org/W1768994003","https://openalex.org/W1807158275","https://openalex.org/W1964807684","https://openalex.org/W1967650867","https://openalex.org/W1978085843","https://openalex.org/W1982777001","https://openalex.org/W1985286038","https://openalex.org/W2032677397","https://openalex.org/W2068909745","https://openalex.org/W2089848273","https://openalex.org/W2097551900","https://openalex.org/W2099583675","https://openalex.org/W2153048208","https://openalex.org/W2170382128","https://openalex.org/W3023473353","https://openalex.org/W3146468402","https://openalex.org/W6630955060","https://openalex.org/W6638045046","https://openalex.org/W6644702558","https://openalex.org/W6667846312","https://openalex.org/W6673229790"],"related_works":["https://openalex.org/W1555349535","https://openalex.org/W2583128298","https://openalex.org/W2053359564","https://openalex.org/W2161159383","https://openalex.org/W1495260638","https://openalex.org/W1511204342","https://openalex.org/W2369125128","https://openalex.org/W2369223577","https://openalex.org/W2010020348","https://openalex.org/W1982580072"],"abstract_inverted_index":{"Perhaps":[0],"one":[1],"of":[2,39,45,52,67,113,122,177,194,244,256,286],"the":[3,27,42,75,87,98,111,116,129,135,159,174,191,195,213,233,263,267,272],"most":[4],"important":[5],"design":[6,253],"aspects":[7],"for":[8,48,202,217],"smartphones":[9],"and":[10,115],"tablets":[11],"is":[12,60,228,239],"improving":[13,41,123,187],"their":[14,90],"energy":[15,43,130],"efficiency.":[16],"Unfortunately,":[17],"rich":[18],"media":[19],"content":[20],"applications":[21],"typically":[22],"put":[23],"significant":[24,65],"pressure":[25],"to":[26,72,84,97,103,127,182,198,209,261],"GPU's":[28],"memory":[29,68,117,184,287],"subsystem.":[30],"In":[31,125],"this":[32,49,206,227],"paper":[33],"we":[34,138,149,157,224,248,251,279],"propose":[35,145],"a":[36,64,105,120,140,146],"novel":[37],"means":[38,121],"dramatically":[40],"efficiency":[44,131],"these":[46,237],"devices,":[47],"popular":[50],"type":[51],"applications.":[53],"The":[54],"main":[55],"hurdle":[56],"in":[57,70,170,212,236,294],"doing":[58],"so":[59,94],"that":[61,96,226,250,258,281],"GPUs":[62],"require":[63],"amount":[66],"bandwidth":[69,185,288],"order":[71,126],"fetch":[73],"all":[74],"necessary":[76],"textures":[77,101],"from":[78],"memory.":[79],"Although":[80],"consecutive":[81,166,180,204],"frames":[82,167,181],"tend":[83],"operate":[85],"on":[86],"same":[88],"textures,":[89],"re-use":[91],"distances":[92],"are":[93,168],"big":[95],"caches":[99],"fetching":[100],"appears":[102],"be":[104,199],"streaming":[106],"operation.":[107],"Traditional":[108],"designs":[109],"improve":[110],"degree":[112,176],"multi-threading":[114],"bandwidth,":[118],"as":[119,232],"performance.":[124],"meet":[128],"standards":[132],"required":[133],"by":[134,186,266],"mobile":[136],"market,":[137],"need":[139],"different":[141],"approach.":[142],"We":[143],"thus":[144,270],"technique":[147],"which":[148],"term":[150],"Parallel":[151],"Frame":[152],"Rendering":[153],"(PFR).":[154],"Under":[155],"PFR,":[156],"split":[158],"GPU":[160],"into":[161],"two":[162,165,203],"clusters":[163],"where":[164],"rendered":[169],"parallel.":[171],"PFR":[172,218,257,282],"exploits":[173],"high":[175],"similarity":[178],"between":[179],"save":[183],"texture":[188],"locality.":[189],"Since":[190],"physics":[192],"part":[193],"rendering":[196],"has":[197],"computed":[200],"sequentially":[201],"frames,":[205],"naturally":[207],"leads":[208],"an":[210,230],"increase":[211],"input":[214],"delay":[215],"latency":[216],"compared":[219],"with":[220,290],"traditional":[221],"systems.":[222,246],"However":[223],"argue":[225],"rarely":[229],"issue,":[231],"user":[234,274],"interface":[235],"devices":[238],"much":[240],"slower":[241],"than":[242],"those":[243],"desktop":[245],"Moreover,":[247],"show":[249,280],"can":[252,283],"reactive":[254],"forms":[255],"allow":[259],"us":[260],"bound":[262],"lag":[264],"observed":[265],"end":[268],"user,":[269],"maintaining":[271],"highest":[273],"experience":[275],"when":[276],"necessary.":[277],"Overall":[278],"achieve":[284],"28%":[285],"savings":[289],"only":[291],"minimal":[292],"loss":[293],"system":[295],"responsiveness.":[296]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":18},{"year":2017,"cited_by_count":13},{"year":2016,"cited_by_count":15},{"year":2015,"cited_by_count":14},{"year":2014,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
