{"id":"https://openalex.org/W2953836263","doi":"https://doi.org/10.1109/igcc.2018.8752137","title":"How Much Cache is Enough? A Cache Behavior Analysis for Machine Learning GPU Architectures","display_name":"How Much Cache is Enough? A Cache Behavior Analysis for Machine Learning GPU Architectures","publication_year":2018,"publication_date":"2018-10-01","ids":{"openalex":"https://openalex.org/W2953836263","doi":"https://doi.org/10.1109/igcc.2018.8752137","mag":"2953836263"},"language":"en","primary_location":{"id":"doi:10.1109/igcc.2018.8752137","is_oa":false,"landing_page_url":"https://doi.org/10.1109/igcc.2018.8752137","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Ninth International Green and Sustainable Computing Conference (IGSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102940391","display_name":"Sonia Mart\u00edn L\u00f3pez","orcid":"https://orcid.org/0000-0002-4308-5572"},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"S. Lopez","raw_affiliation_strings":["Computer Engineering Department, Rochester Institute of Technology, Rochester, NY"],"affiliations":[{"raw_affiliation_string":"Computer Engineering Department, Rochester Institute of Technology, Rochester, NY","institution_ids":["https://openalex.org/I155173764"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044858493","display_name":"Yash Nimkar","orcid":null},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Y. Nimkar","raw_affiliation_strings":["Computer Engineering Department, Rochester Institute of Technology, Rochester, NY"],"affiliations":[{"raw_affiliation_string":"Computer Engineering Department, Rochester Institute of Technology, Rochester, NY","institution_ids":["https://openalex.org/I155173764"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045350419","display_name":"Gerald Kotas","orcid":null},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"G. Kotas","raw_affiliation_strings":["Computer Engineering Department, Rochester Institute of Technology, Rochester, NY"],"affiliations":[{"raw_affiliation_string":"Computer Engineering Department, Rochester Institute of Technology, Rochester, NY","institution_ids":["https://openalex.org/I155173764"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102940391"],"corresponding_institution_ids":["https://openalex.org/I155173764"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.24945001,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8800029754638672},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.8447955846786499},{"id":"https://openalex.org/keywords/cache-pollution","display_name":"Cache pollution","score":0.7598984241485596},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.732582151889801},{"id":"https://openalex.org/keywords/cache-coloring","display_name":"Cache coloring","score":0.6762899160385132},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6757056713104248},{"id":"https://openalex.org/keywords/smart-cache","display_name":"Smart Cache","score":0.6144423484802246},{"id":"https://openalex.org/keywords/cache-invalidation","display_name":"Cache invalidation","score":0.5770590305328369},{"id":"https://openalex.org/keywords/memory-hierarchy","display_name":"Memory hierarchy","score":0.5696483254432678},{"id":"https://openalex.org/keywords/cache-oblivious-algorithm","display_name":"Cache-oblivious algorithm","score":0.5665019750595093},{"id":"https://openalex.org/keywords/page-cache","display_name":"Page cache","score":0.5455623269081116},{"id":"https://openalex.org/keywords/cpu-cache","display_name":"CPU cache","score":0.4326852858066559},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.34502702951431274}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8800029754638672},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.8447955846786499},{"id":"https://openalex.org/C113166858","wikidata":"https://www.wikidata.org/wiki/Q5015981","display_name":"Cache pollution","level":5,"score":0.7598984241485596},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.732582151889801},{"id":"https://openalex.org/C201148951","wikidata":"https://www.wikidata.org/wiki/Q5015976","display_name":"Cache coloring","level":4,"score":0.6762899160385132},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6757056713104248},{"id":"https://openalex.org/C167713795","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"Smart Cache","level":5,"score":0.6144423484802246},{"id":"https://openalex.org/C25536678","wikidata":"https://www.wikidata.org/wiki/Q5015977","display_name":"Cache invalidation","level":5,"score":0.5770590305328369},{"id":"https://openalex.org/C2778100165","wikidata":"https://www.wikidata.org/wiki/Q1589327","display_name":"Memory hierarchy","level":3,"score":0.5696483254432678},{"id":"https://openalex.org/C59687516","wikidata":"https://www.wikidata.org/wiki/Q5015938","display_name":"Cache-oblivious algorithm","level":5,"score":0.5665019750595093},{"id":"https://openalex.org/C36340418","wikidata":"https://www.wikidata.org/wiki/Q7124288","display_name":"Page cache","level":5,"score":0.5455623269081116},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.4326852858066559},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.34502702951431274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/igcc.2018.8752137","is_oa":false,"landing_page_url":"https://doi.org/10.1109/igcc.2018.8752137","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Ninth International Green and Sustainable Computing Conference (IGSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8999999761581421,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W58105879","https://openalex.org/W2023062763","https://openalex.org/W2036953536","https://openalex.org/W2160428323","https://openalex.org/W2163687928","https://openalex.org/W2328929289","https://openalex.org/W2519021283","https://openalex.org/W2541463506","https://openalex.org/W2736244279","https://openalex.org/W2951075198"],"related_works":["https://openalex.org/W2098406302","https://openalex.org/W2535115842","https://openalex.org/W2734782074","https://openalex.org/W2546991807","https://openalex.org/W2020176098","https://openalex.org/W2076114130","https://openalex.org/W2121191383","https://openalex.org/W1584415117","https://openalex.org/W2500877097","https://openalex.org/W2436169747"],"abstract_inverted_index":{"Graphic":[0],"Processing":[1],"Units":[2],"(GPUs)":[3],"are":[4],"highly":[5],"parallel,":[6],"power":[7,127],"hungry":[8],"devices":[9],"with":[10,142],"large":[11,59],"numbers":[12],"of":[13,27,33,37,53,61,79,95,106,124,131,137],"transistors":[14,62],"devoted":[15,65],"to":[16,39,66],"the":[17,50,67,76,80,84,96,119,125,132,138,146],"cache":[18,68,81,98,116,140],"hierarchy.":[19,70],"Machine":[20,88],"learning":[21],"is":[22,49,63],"a":[23,58,102,114],"target":[24],"application":[25],"field":[26],"these":[28,56],"devices,":[29,57],"which":[30],"take":[31],"advantage":[32],"their":[34],"high":[35],"levels":[36],"parallelism":[38,48],"hide":[40],"long":[41],"latency":[42],"memory":[43,69],"access":[44,136],"dependencies.":[45],"Even":[46],"though":[47],"main":[51],"source":[52],"performance":[54],"in":[55,101,110,122],"number":[60,105],"still":[64],"Upon":[71],"detailed":[72],"analysis,":[73],"we":[74,91,112],"measure":[75],"real":[77],"impact":[78,144],"hierarchy":[82],"on":[83,145],"overall":[85,147],"performance.":[86,148],"Targeting":[87],"Learning":[89],"applications,":[90],"observed":[92],"that":[93],"most":[94],"successful":[97],"accesses":[99],"happen":[100],"very":[103],"reduced":[104],"blocks.":[107],"With":[108],"this":[109],"mind,":[111],"propose":[113],"different":[115],"configuration":[117],"for":[118],"GPU,":[120],"resulting":[121],"25%":[123],"leakage":[126],"consumption":[128],"and":[129],"10%":[130],"dynamic":[133],"energy":[134],"per":[135],"original":[139],"configuration,":[141],"minimal":[143]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
