{"id":"https://openalex.org/W2527855935","doi":"https://doi.org/10.1109/iiswc.2016.7581276","title":"ID-cache: instruction and memory divergence based cache management for GPUs","display_name":"ID-cache: instruction and memory divergence based cache management for GPUs","publication_year":2016,"publication_date":"2016-09-01","ids":{"openalex":"https://openalex.org/W2527855935","doi":"https://doi.org/10.1109/iiswc.2016.7581276","mag":"2527855935"},"language":"en","primary_location":{"id":"doi:10.1109/iiswc.2016.7581276","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iiswc.2016.7581276","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Symposium on Workload Characterization (IISWC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087438386","display_name":"Akhil Arunkumar","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Akhil Arunkumar","raw_affiliation_strings":["School of Computing, Arizona State University"],"affiliations":[{"raw_affiliation_string":"School of Computing, Arizona State University","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075111485","display_name":"Shin-Ying Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shin-ying Lee","raw_affiliation_strings":["School of Computing, Arizona State University"],"affiliations":[{"raw_affiliation_string":"School of Computing, Arizona State University","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028220093","display_name":"Carole-Jean Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Carole-jean Wu","raw_affiliation_strings":["School of Computing, Arizona State University"],"affiliations":[{"raw_affiliation_string":"School of Computing, Arizona State University","institution_ids":["https://openalex.org/I55732556"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5087438386"],"corresponding_institution_ids":["https://openalex.org/I55732556"],"apc_list":null,"apc_paid":null,"fwci":2.2073,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.87380102,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8662629127502441},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.7631872296333313},{"id":"https://openalex.org/keywords/cache-coloring","display_name":"Cache coloring","score":0.7111712098121643},{"id":"https://openalex.org/keywords/cache-pollution","display_name":"Cache pollution","score":0.6993506550788879},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6963647603988647},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.5827368497848511},{"id":"https://openalex.org/keywords/page-cache","display_name":"Page cache","score":0.5318094491958618},{"id":"https://openalex.org/keywords/smart-cache","display_name":"Smart Cache","score":0.5201318860054016},{"id":"https://openalex.org/keywords/memory-bandwidth","display_name":"Memory bandwidth","score":0.44199663400650024},{"id":"https://openalex.org/keywords/cache-invalidation","display_name":"Cache invalidation","score":0.42834970355033875},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.342426598072052},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.3279768228530884}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8662629127502441},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.7631872296333313},{"id":"https://openalex.org/C201148951","wikidata":"https://www.wikidata.org/wiki/Q5015976","display_name":"Cache coloring","level":4,"score":0.7111712098121643},{"id":"https://openalex.org/C113166858","wikidata":"https://www.wikidata.org/wiki/Q5015981","display_name":"Cache pollution","level":5,"score":0.6993506550788879},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6963647603988647},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.5827368497848511},{"id":"https://openalex.org/C36340418","wikidata":"https://www.wikidata.org/wiki/Q7124288","display_name":"Page cache","level":5,"score":0.5318094491958618},{"id":"https://openalex.org/C167713795","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"Smart Cache","level":5,"score":0.5201318860054016},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.44199663400650024},{"id":"https://openalex.org/C25536678","wikidata":"https://www.wikidata.org/wiki/Q5015977","display_name":"Cache invalidation","level":5,"score":0.42834970355033875},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.342426598072052},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.3279768228530884}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iiswc.2016.7581276","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iiswc.2016.7581276","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Symposium on Workload Characterization (IISWC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1968271929","https://openalex.org/W1979527452","https://openalex.org/W1982996921","https://openalex.org/W1989061323","https://openalex.org/W1999621870","https://openalex.org/W2020572638","https://openalex.org/W2021211271","https://openalex.org/W2027806965","https://openalex.org/W2047060659","https://openalex.org/W2060087084","https://openalex.org/W2062527253","https://openalex.org/W2065562952","https://openalex.org/W2067441262","https://openalex.org/W2078994750","https://openalex.org/W2080592089","https://openalex.org/W2081583983","https://openalex.org/W2084309410","https://openalex.org/W2091583059","https://openalex.org/W2092283255","https://openalex.org/W2095258606","https://openalex.org/W2106617337","https://openalex.org/W2129817042","https://openalex.org/W2149412112","https://openalex.org/W2152356827","https://openalex.org/W2157800896","https://openalex.org/W4237024478","https://openalex.org/W4244089596","https://openalex.org/W4248430743","https://openalex.org/W6673860370"],"related_works":["https://openalex.org/W2133489088","https://openalex.org/W2118932116","https://openalex.org/W2114386333","https://openalex.org/W2535115842","https://openalex.org/W2126408955","https://openalex.org/W2396934146","https://openalex.org/W2363769136","https://openalex.org/W2148571123","https://openalex.org/W2539712666","https://openalex.org/W2270982805"],"abstract_inverted_index":{"Modern":[0],"graphic":[1],"processing":[2],"units":[3],"(GPUs)":[4],"are":[5,37],"not":[6],"only":[7],"able":[8,176],"to":[9,52,122,140,177],"perform":[10,15],"graphics":[11],"rendering,":[12],"but":[13],"also":[14],"general":[16],"purpose":[17],"parallel":[18],"computations":[19],"(GPGPUs).":[20],"It":[21],"has":[22],"been":[23],"shown":[24],"that":[25,113,174],"the":[26,32,54,70,77,94,102,130,157],"GPU":[27],"L1":[28],"data":[29],"cache":[30,64,86,127,143,171,190],"and":[31,43,58,65,82,97,116,168,191],"on":[33,69,150,156],"chip":[34],"interconnect":[35,66,192],"bandwidth":[36,67],"important":[38],"sources":[39,55],"of":[40,56,79,85,104,145,181,189],"performance":[41,183],"bottlenecks":[42],"inefficiencies":[44,57],"in":[45],"GPGPUs.":[46],"Through":[47,107],"this":[48],"work,":[49],"we":[50,111,163],"aim":[51],"understand":[53],"possible":[59],"opportunities":[60],"for":[61,185],"more":[62],"efficient":[63],"management":[68,172],"GPUs.":[71],"We":[72],"do":[73],"so":[74],"by":[75],"understanding":[76],"predictability":[78],"reuse":[80,126],"behavior":[81,99],"spatial":[83,152],"utilization":[84],"lines":[87,128,144],"using":[88],"program":[89],"level":[90],"information":[91,135],"such":[92,100],"as":[93,101],"instruction":[95],"PC,":[96,115],"runtime":[98],"extent":[103],"memory":[105,117,133,169],"divergence.":[106],"our":[108,161],"characterization":[109],"results,":[110],"demonstrate":[112],"a)":[114],"divergence":[118,134],"can":[119,136],"be":[120,138],"used":[121,139],"efficiently":[123],"bypass":[124],"zero":[125],"from":[129],"cache;":[131],"b)":[132],"further":[137],"dynamically":[141],"insert":[142],"varying":[146],"size":[147],"granularities":[148],"based":[149,155],"their":[151],"utilization.":[153],"Finally,":[154],"insights":[158],"derived":[159],"through":[160],"characterization,":[162],"design":[164],"a":[165,186],"simple":[166],"Instruction":[167],"Divergence":[170],"method":[173],"is":[175],"achieve":[178],"an":[179],"average":[180],"71%":[182],"improvement":[184],"wide":[187],"variety":[188],"sensitive":[193],"applications.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":1}],"updated_date":"2026-01-28T23:14:49.684275","created_date":"2025-10-10T00:00:00"}
