{"id":"https://openalex.org/W7133516902","doi":"https://doi.org/10.1109/hpca68181.2026.11408572","title":"TENET-v2: Applying Relation-Centric Notation to Model and Optimize Data Swizzle in the Cache of Modern NPU","display_name":"TENET-v2: Applying Relation-Centric Notation to Model and Optimize Data Swizzle in the Cache of Modern NPU","publication_year":2026,"publication_date":"2026-01-31","ids":{"openalex":"https://openalex.org/W7133516902","doi":"https://doi.org/10.1109/hpca68181.2026.11408572"},"language":null,"primary_location":{"id":"doi:10.1109/hpca68181.2026.11408572","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca68181.2026.11408572","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102897644","display_name":"Hanyu Zhang","orcid":"https://orcid.org/0009-0007-6860-9006"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hanyu Zhang","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128097207","display_name":"Fangxu Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fangxu Guo","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128056124","display_name":"Liqiang Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liqiang Lu","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039807594","display_name":"Long Wang","orcid":"https://orcid.org/0009-0004-1638-5993"},"institutions":[{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Long Wang","raw_affiliation_strings":["Huawei Technologies Co., Ltd"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co., Ltd","institution_ids":["https://openalex.org/I4210160618"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101868264","display_name":"Yunfei Du","orcid":null},"institutions":[{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yunfei Du","raw_affiliation_strings":["Huawei Technologies Co., Ltd"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co., Ltd","institution_ids":["https://openalex.org/I4210160618"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128044975","display_name":"Zhe Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhe Wang","raw_affiliation_strings":["Huawei Technologies Co., Ltd"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co., Ltd","institution_ids":["https://openalex.org/I4210160618"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jinghan Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]},{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Jinghan Zhang","raw_affiliation_strings":["Huawei Technologies Co., Ltd","Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co., Ltd","institution_ids":["https://openalex.org/I4210160618"]},{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128051093","display_name":"Jie Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]},{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Jie Zhang","raw_affiliation_strings":["Huawei Technologies Co., Ltd","Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Co., Ltd","institution_ids":["https://openalex.org/I4210160618"]},{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127894039","display_name":"Chenli Xue","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenli Xue","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065671838","display_name":"Chengpeng Wu","orcid":"https://orcid.org/0000-0002-4123-639X"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengpeng Wu","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128054169","display_name":"Ziyi Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziyi Zhang","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128098635","display_name":"Yun Liang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun Liang","raw_affiliation_strings":["Peking University"],"affiliations":[{"raw_affiliation_string":"Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072186367","display_name":"Size Zheng","orcid":"https://orcid.org/0000-0002-9471-1780"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Size Zheng","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5128081176","display_name":"Jianwei Yin","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianwei Yin","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5102897644"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.50110145,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.028999999165534973,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.028999999165534973,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.02199999988079071,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13650","display_name":"Computational Physics and Python Applications","score":0.01889999955892563,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.4740999937057495},{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.3587000072002411},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.262800008058548},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.2547000050544739}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7716000080108643},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.4740999937057495},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4480000138282776},{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.3587000072002411},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.29600000381469727},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.2815000116825104},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.28119999170303345},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.27459999918937683},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.262800008058548},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca68181.2026.11408572","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca68181.2026.11408572","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1519538706","https://openalex.org/W2048266589","https://openalex.org/W2096949479","https://openalex.org/W2119766542","https://openalex.org/W2194775991","https://openalex.org/W2328769609","https://openalex.org/W2612148068","https://openalex.org/W2940862705","https://openalex.org/W2949967139","https://openalex.org/W2954478959","https://openalex.org/W2954698171","https://openalex.org/W2980104813","https://openalex.org/W2980113464","https://openalex.org/W2985039650","https://openalex.org/W3016542674","https://openalex.org/W3097777922","https://openalex.org/W3102510044","https://openalex.org/W3103168911","https://openalex.org/W3123054690","https://openalex.org/W3130920634","https://openalex.org/W3155922894","https://openalex.org/W3157657667","https://openalex.org/W3158831985","https://openalex.org/W3177452048","https://openalex.org/W3187498994","https://openalex.org/W3190092209","https://openalex.org/W3211490618","https://openalex.org/W4221089937","https://openalex.org/W4288083528","https://openalex.org/W4312639064","https://openalex.org/W4321446237","https://openalex.org/W4327930477","https://openalex.org/W4389500318","https://openalex.org/W4401212175","https://openalex.org/W4404955793"],"related_works":[],"abstract_inverted_index":{"Swizzle":[0],"is":[1],"a":[2,53,62,79,107,150],"data":[3],"access":[4,69],"pattern":[5],"optimization":[6,27,179],"technique":[7],"by":[8,162],"reorganizing":[9],"the":[10,18],"execution":[11],"order":[12],"of":[13,137,152],"computational":[14],"tasks":[15],"to":[16,38,65,94,116,145,164],"improve":[17],"cache":[19,41,68,84,96,101,119,123,177],"locality":[20],"in":[21,140],"modern":[22],"NPUs.":[23],"Existing":[24],"analysis":[25],"and":[26,36,57,105],"techniques":[28],"lack":[29],"support":[30],"for":[31,55,83],"swizzleaware":[32],"modeling":[33,56],"on":[34,149,170,181],"NPUs":[35],"fail":[37],"effectively":[39],"capture":[40],"behavior":[42,98,120],"across":[43],"diverse":[44],"swizzle":[45,74],"configurations.":[46],"To":[47],"this":[48],"end,":[49],"we":[50,77],"propose":[51,78],"TENET-v2,":[52],"framework":[54],"optimizing":[58],"swizzle.":[59],"We":[60,173],"introduce":[61],"relation-centric":[63],"notation":[64],"characterize":[66],"different":[67],"patterns,":[70],"thus":[71],"exploring":[72],"wider":[73],"space.":[75],"Then,":[76],"hybrid":[80],"performance":[81,88],"model":[82,89,118],"analysis.":[85],"The":[86],"proposed":[87],"uses":[90],"an":[91,112,133],"analytical":[92],"approach":[93],"quantify":[95],"miss":[97],"under":[99,121],"unsaturated":[100],"conditions":[102,124],"(non-saturated":[103],"misses),":[104],"employs":[106],"simulation":[108],"method":[109],"combined":[110],"with":[111],"early":[113],"exiting":[114],"mechanism":[115],"rapidly":[117],"saturated":[122],"(saturated":[125],"misses).":[126],"Experimental":[127],"evaluations":[128],"demonstrate":[129,175],"that":[130,155],"TENET-v2":[131,156],"achieves":[132],"average":[134],"absolute":[135],"error":[136],"1.05":[138],"%":[139],"read":[141],"hit":[142],"rate":[143],"compared":[144],"real-world":[146],"hardware.":[147],"Evaluation":[148],"variety":[151],"DNNs":[153],"shows":[154],"outperforms":[157],"existing":[158],"tensor":[159],"program":[160],"optimizers":[161],"up":[163],"<tex":[165],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[166],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{1.":[167],"5}":[168],"\\times$</tex>":[169],"A100":[171],"GPUs.":[172],"also":[174],"NPU":[176],"size":[178],"based":[180],"TENET-v2.":[182]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-03-05T00:00:00"}
