{"id":"https://openalex.org/W4360831786","doi":"https://doi.org/10.1109/hpca56546.2023.10071047","title":"HeatViT: Hardware-Efficient Adaptive Token Pruning for Vision Transformers","display_name":"HeatViT: Hardware-Efficient Adaptive Token Pruning for Vision Transformers","publication_year":2023,"publication_date":"2023-02-01","ids":{"openalex":"https://openalex.org/W4360831786","doi":"https://doi.org/10.1109/hpca56546.2023.10071047"},"language":"en","primary_location":{"id":"doi:10.1109/hpca56546.2023.10071047","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca56546.2023.10071047","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089349472","display_name":"Peiyan Dong","orcid":"https://orcid.org/0000-0001-5287-5149"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":true,"raw_author_name":"Peiyan Dong","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083232044","display_name":"Mengshu Sun","orcid":"https://orcid.org/0000-0003-3540-1464"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Mengshu Sun","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067662998","display_name":"Alec Lu","orcid":"https://orcid.org/0000-0002-3315-7368"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Alec Lu","raw_affiliation_strings":["Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088784101","display_name":"Yanyue Xie","orcid":"https://orcid.org/0000-0002-4325-521X"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Yanyue Xie","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004089365","display_name":"Kenneth Liu","orcid":"https://orcid.org/0009-0002-1348-6583"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Kenneth Liu","raw_affiliation_strings":["Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078971265","display_name":"Zhenglun Kong","orcid":"https://orcid.org/0000-0002-8120-4456"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Zhenglun Kong","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101543801","display_name":"Xin Meng","orcid":"https://orcid.org/0000-0003-1376-0917"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Xin Meng","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101633365","display_name":"Zhengang Li","orcid":"https://orcid.org/0000-0001-6644-4761"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Zhengang Li","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101695981","display_name":"Xue Lin","orcid":"https://orcid.org/0000-0002-3088-2767"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Xue Lin","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065889904","display_name":"Zhenman Fang","orcid":"https://orcid.org/0000-0003-0603-9697"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Zhenman Fang","raw_affiliation_strings":["Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100651384","display_name":"Yanzhi Wang","orcid":"https://orcid.org/0000-0002-3024-7990"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Yanzhi Wang","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5089349472"],"corresponding_institution_ids":["https://openalex.org/I87182695"],"apc_list":null,"apc_paid":null,"fwci":11.8687,"has_fulltext":false,"cited_by_count":91,"citation_normalized_percentile":{"value":0.99131733,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"442","last_page":"455"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7950792908668518},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.6913418769836426},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.646964430809021},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.6000881195068359},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5793046355247498},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.5525076389312744},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5411062240600586},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.5255944728851318},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.35092607140541077},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.34731703996658325},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3309670686721802},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.21794140338897705}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7950792908668518},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.6913418769836426},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.646964430809021},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.6000881195068359},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5793046355247498},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.5525076389312744},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5411062240600586},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.5255944728851318},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.35092607140541077},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.34731703996658325},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3309670686721802},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.21794140338897705},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca56546.2023.10071047","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca56546.2023.10071047","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W569478347","https://openalex.org/W1969733464","https://openalex.org/W2105482032","https://openalex.org/W2413794162","https://openalex.org/W2752782242","https://openalex.org/W2792643794","https://openalex.org/W2896457183","https://openalex.org/W2896983500","https://openalex.org/W2899663614","https://openalex.org/W2952122856","https://openalex.org/W2963150697","https://openalex.org/W2963351113","https://openalex.org/W2965942869","https://openalex.org/W2970896726","https://openalex.org/W2982083293","https://openalex.org/W3003315945","https://openalex.org/W3035251378","https://openalex.org/W3047848469","https://openalex.org/W3094349784","https://openalex.org/W3096609285","https://openalex.org/W3098873988","https://openalex.org/W3121523901","https://openalex.org/W3131500599","https://openalex.org/W3133696297","https://openalex.org/W3139445856","https://openalex.org/W3168114581","https://openalex.org/W3168124404","https://openalex.org/W3169769781","https://openalex.org/W3170233084","https://openalex.org/W3170841864","https://openalex.org/W3171125843","https://openalex.org/W3172801447","https://openalex.org/W3174402370","https://openalex.org/W3176468986","https://openalex.org/W3177183540","https://openalex.org/W3185102306","https://openalex.org/W3188427387","https://openalex.org/W3199934250","https://openalex.org/W3202742610","https://openalex.org/W3204801262","https://openalex.org/W3211787299","https://openalex.org/W3214835194","https://openalex.org/W4211085526","https://openalex.org/W4214493665","https://openalex.org/W4214636423","https://openalex.org/W4292779060","https://openalex.org/W4312340826","https://openalex.org/W4312872526","https://openalex.org/W4312910119","https://openalex.org/W4321232185","https://openalex.org/W4321637298","https://openalex.org/W4365446402","https://openalex.org/W4385245566","https://openalex.org/W6758657797","https://openalex.org/W6761472960","https://openalex.org/W6767025246","https://openalex.org/W6778883912","https://openalex.org/W6784094891","https://openalex.org/W6784333009","https://openalex.org/W6788135285","https://openalex.org/W6790690058","https://openalex.org/W6793979934","https://openalex.org/W6796494063","https://openalex.org/W6796580215","https://openalex.org/W6796617330","https://openalex.org/W6797478244","https://openalex.org/W6797854001","https://openalex.org/W6803469875","https://openalex.org/W6810818354"],"related_works":["https://openalex.org/W2532502681","https://openalex.org/W3183118997","https://openalex.org/W3214410901","https://openalex.org/W3204400881","https://openalex.org/W3204296682","https://openalex.org/W2917767146","https://openalex.org/W4319952061","https://openalex.org/W4280636456","https://openalex.org/W4388913998","https://openalex.org/W4310584535"],"abstract_inverted_index":{"While":[0],"vision":[1],"transformers":[2],"(ViTs)":[3],"have":[4,25],"continuously":[5],"achieved":[6],"new":[7],"milestones":[8],"in":[9,61,144],"the":[10,57,87,96,114,119,139,153,167,194,199,208],"field":[11],"of":[12,205,221],"computer":[13],"vision,":[14],"their":[15,27],"sophisticated":[16],"network":[17],"architectures":[18],"with":[19,132,215],"high":[20],"computation":[21,155,179],"and":[22,69,85,128,191,225],"memory":[23],"costs":[24],"impeded":[26],"deployment":[28],"on":[29,52,56,99,135,193,207],"resource-limited":[30],"edge":[31],"devices.":[32],"In":[33],"this":[34],"paper,":[35],"we":[36,63,94,122],"propose":[37,129],"a":[38,216],"hardware-efficient":[39],"image-adaptive":[40],"token":[41,72,97],"pruning":[42,150],"framework":[43],"called":[44],"HeatViT":[45,157,171,206],"for":[46,113,138,181],"efficient":[47],"yet":[48],"accurate":[49],"ViT":[50,149],"acceleration":[51],"embedded":[53],"FPGAs.":[54],"Based":[55],"inherent":[58],"computational":[59],"patterns":[60],"ViTs,":[62,185],"first":[64],"adopt":[65],"an":[66],"effective,":[67],"hardware-efficient,":[68],"learnable":[70],"head-evaluation":[71],"selector,":[73],"which":[74],"can":[75,158,172],"be":[76],"progressively":[77],"inserted":[78],"before":[79],"transformer":[80],"blocks":[81],"to":[82,106,147,198],"dynamically":[83],"identify":[84],"consolidate":[86],"non-informative":[88],"tokens":[89],"from":[90],"input":[91],"images.":[92],"Moreover,":[93],"implement":[95],"selector":[98],"hardware":[100,110,120,201],"by":[101],"adding":[102],"miniature":[103],"control":[104],"logic":[105],"heavily":[107],"reuse":[108],"existing":[109,148],"components":[111],"built":[112],"backbone":[115],"ViT.":[116],"To":[117],"improve":[118],"efficiency,":[121],"further":[123],"employ":[124],"8-bit":[125],"fixed-point":[126],"quantization":[127,136],"polynomial":[130],"approximations":[131],"regularization":[133],"effect":[134],"error":[137],"frequently":[140],"used":[141,184],"nonlinear":[142],"functions":[143],"ViTs.":[145],"Compared":[146,197],"studies,":[151],"under":[152,166],"similar":[154,168],"cost,":[156],"achieve":[159,173,212],"0.7%":[160],"~":[161,177],"8.9%":[162],"higher":[163],"accuracy;":[164],"while":[165],"model":[169],"accuracy,":[170],"more":[174,223,227],"than":[175],"28.4%":[176],"65.3%":[178],"reduction,":[180],"various":[182],"widely":[183],"including":[186],"DeiT-T,":[187],"DeiT-S,":[188],"DeiT-B,":[189],"LV-ViT-S,":[190],"LV-ViT-M,":[192],"ImageNet":[195],"dataset.":[196],"baseline":[200],"accelerator,":[202],"our":[203],"implementations":[204],"Xilinx":[209],"ZCU102":[210],"FPGA":[211],"3.46\u00d7~4.89\u00d7":[213],"speedup":[214],"trivial":[217],"resource":[218],"utilization":[219],"overhead":[220],"8%~11%":[222],"DSPs":[224],"5%~8%":[226],"LUTs.":[228]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":52},{"year":2024,"cited_by_count":28},{"year":2023,"cited_by_count":7}],"updated_date":"2026-03-28T08:17:26.163206","created_date":"2025-10-10T00:00:00"}
