{"id":"https://openalex.org/W4414197012","doi":"https://doi.org/10.1109/dac63849.2025.11132440","title":"Buffer Prospector: Discovering and Exploiting Untapped Buffer Resources in Many-Core DNN Accelerators","display_name":"Buffer Prospector: Discovering and Exploiting Untapped Buffer Resources in Many-Core DNN Accelerators","publication_year":2025,"publication_date":"2025-06-22","ids":{"openalex":"https://openalex.org/W4414197012","doi":"https://doi.org/10.1109/dac63849.2025.11132440"},"language":"en","primary_location":{"id":"doi:10.1109/dac63849.2025.11132440","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac63849.2025.11132440","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 62nd ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010247448","display_name":"Yuchen Wei","orcid":"https://orcid.org/0009-0003-5752-5422"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuchen Wei","raw_affiliation_strings":["Tsinghua Univeristy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua Univeristy","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001158014","display_name":"Jingwei Cai","orcid":"https://orcid.org/0009-0003-7560-8141"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingwei Cai","raw_affiliation_strings":["Tsinghua Univeristy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua Univeristy","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026297396","display_name":"Mingyu Gao","orcid":"https://orcid.org/0000-0001-8433-7281"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingyu Gao","raw_affiliation_strings":["Tsinghua Univeristy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua Univeristy","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102847848","display_name":"Sen Peng","orcid":"https://orcid.org/0009-0002-5312-2557"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sen Peng","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087025919","display_name":"Zuotong Wu","orcid":"https://orcid.org/0009-0000-1368-661X"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zuotong Wu","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101248909","display_name":"Guiming Shi","orcid":"https://orcid.org/0009-0003-0663-0863"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guiming Shi","raw_affiliation_strings":["Tsinghua Univeristy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua Univeristy","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006570986","display_name":"Kaisheng Ma","orcid":"https://orcid.org/0000-0001-9226-3366"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaisheng Ma","raw_affiliation_strings":["Tsinghua Univeristy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua Univeristy","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0704,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.79984163,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9804999828338623,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9804999828338623,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11216","display_name":"Radiation Detection and Scintillator Technologies","score":0.9722999930381775,"subfield":{"id":"https://openalex.org/subfields/3108","display_name":"Radiation"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11005","display_name":"Radiation Effects in Electronics","score":0.9452000260353088,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/buffer","display_name":"Buffer (optical fiber)","score":0.8427000045776367},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6370999813079834},{"id":"https://openalex.org/keywords/calculator","display_name":"Calculator","score":0.5382999777793884},{"id":"https://openalex.org/keywords/buffer-zone","display_name":"Buffer zone","score":0.45419999957084656},{"id":"https://openalex.org/keywords/buffer-overflow","display_name":"Buffer overflow","score":0.44620001316070557},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.4207000136375427}],"concepts":[{"id":"https://openalex.org/C145018004","wikidata":"https://www.wikidata.org/wiki/Q4985944","display_name":"Buffer (optical fiber)","level":2,"score":0.8427000045776367},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7208999991416931},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6370999813079834},{"id":"https://openalex.org/C2776836400","wikidata":"https://www.wikidata.org/wiki/Q31087","display_name":"Calculator","level":2,"score":0.5382999777793884},{"id":"https://openalex.org/C2778043458","wikidata":"https://www.wikidata.org/wiki/Q1054581","display_name":"Buffer zone","level":2,"score":0.45419999957084656},{"id":"https://openalex.org/C40842320","wikidata":"https://www.wikidata.org/wiki/Q19423","display_name":"Buffer overflow","level":2,"score":0.44620001316070557},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.4207000136375427},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.396699994802475},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.31279999017715454},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.27799999713897705},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.272599995136261},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26159998774528503},{"id":"https://openalex.org/C2984074130","wikidata":"https://www.wikidata.org/wiki/Q73539779","display_name":"R package","level":2,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dac63849.2025.11132440","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac63849.2025.11132440","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 62nd ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2097117768","https://openalex.org/W2194775991","https://openalex.org/W2935331687","https://openalex.org/W2940862705","https://openalex.org/W2963446712","https://openalex.org/W2980104813","https://openalex.org/W2980200167","https://openalex.org/W3135242540","https://openalex.org/W3187498994","https://openalex.org/W3211226062","https://openalex.org/W4243674899","https://openalex.org/W4288083528","https://openalex.org/W4297097426","https://openalex.org/W4380881063","https://openalex.org/W4385245566","https://openalex.org/W4393592481","https://openalex.org/W4401211704","https://openalex.org/W4409248516"],"related_works":[],"abstract_inverted_index":{"In":[0],"large-scale":[1],"DNN":[2],"inference":[3],"accelerators,":[4],"the":[5,87,97],"many-core":[6,41],"architecture":[7,127],"has":[8],"emerged":[9],"as":[10],"a":[11,19,31,43,63,73,107],"predominant":[12],"design,":[13],"with":[14],"layer-pipeline":[15,38],"(LP)":[16],"mapping":[17,21,39,102],"being":[18],"mainstream":[20],"approach.":[22],"However,":[23],"our":[24],"experimental":[25],"findings":[26],"and":[27,33,65,77,113,117,128],"theoretical":[28],"justifications":[29],"uncover":[30],"hardware-independent":[32],"prevalent":[34],"flaw":[35],"in":[36,92,110],"employing":[37],"on":[40,58,82,126],"accelerators:":[42],"significant":[44],"underutilization":[45],"of":[46],"buffer":[47,67],"space":[48],"across":[49],"numerous":[50],"cores,":[51],"indicating":[52],"substantial":[53],"potential":[54],"for":[55],"optimization.":[56],"Building":[57],"this":[59],"discovery,":[60],"we":[61,121],"develop":[62],"universal":[64],"efficient":[66],"allocation":[68],"strategy,":[69],"BufferProspector,":[70],"which":[71],"includes":[72],"Buffer":[74,78],"Requirement":[75],"Calculator":[76],"Allocator,":[79],"to":[80,96],"capitalize":[81],"these":[83],"unused":[84],"buffers,":[85],"addressing":[86],"timing":[88],"mismatch":[89],"challenge":[90],"inherent":[91],"LP":[93,101],"mapping.":[94,129],"Compared":[95],"state-of-the-art":[98],"(SOTA)":[99],"open-source":[100],"framework":[103],"Tangram,":[104],"BufferProspector":[105,130],"averages":[106],"simultaneous":[108],"increase":[109],"energy":[111],"efficiency":[112],"performance":[114],"by":[115],"1.44\u00d7":[116],"2.26\u00d7,":[118],"respectively.":[119],"Moreover,":[120],"conduct":[122],"some":[123],"case":[124],"studies":[125],"will":[131],"be":[132],"open-sourced.":[133]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
