{"id":"https://openalex.org/W4404133870","doi":"https://doi.org/10.1145/3649329.3655982","title":"TSAcc: An Efficient \\underline{T}empo-\\underline{S}patial Similarity Aware \\underline{Acc}elerator for Attention Acceleration","display_name":"TSAcc: An Efficient \\underline{T}empo-\\underline{S}patial Similarity Aware \\underline{Acc}elerator for Attention Acceleration","publication_year":2024,"publication_date":"2024-06-23","ids":{"openalex":"https://openalex.org/W4404133870","doi":"https://doi.org/10.1145/3649329.3655982"},"language":"en","primary_location":{"id":"doi:10.1145/3649329.3655982","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3649329.3655982","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 61st ACM/IEEE Design Automation Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067161373","display_name":"Zhuoran Song","orcid":"https://orcid.org/0000-0002-6494-4786"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuoran Song","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-6494-4786","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051407403","display_name":"Chunyu Qi","orcid":"https://orcid.org/0009-0004-9814-2468"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunyu Qi","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0004-9814-2468","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102415375","display_name":"Yiyun Yao","orcid":"https://orcid.org/0009-0001-0852-3784"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanzheng Yao","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0001-0852-3784","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103090571","display_name":"Peng Zhou","orcid":"https://orcid.org/0009-0000-0869-9782"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Zhou","raw_affiliation_strings":["Alibaba Cloud, Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0000-0869-9782","affiliations":[{"raw_affiliation_string":"Alibaba Cloud, Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114554077","display_name":"Yanyi Zi","orcid":"https://orcid.org/0009-0000-6936-3908"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanyi Zi","raw_affiliation_strings":["Alibaba Cloud, Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0000-6936-3908","affiliations":[{"raw_affiliation_string":"Alibaba Cloud, Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101816252","display_name":"Nan Wang","orcid":"https://orcid.org/0009-0002-8276-1868"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nan Wang","raw_affiliation_strings":["Alibaba Cloud, Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0002-8276-1868","affiliations":[{"raw_affiliation_string":"Alibaba Cloud, Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056632010","display_name":"Xiaoyao Liang","orcid":"https://orcid.org/0000-0002-2790-5884"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyao Liang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-2790-5884","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.485,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.82860208,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10241","display_name":"Functional Brain Connectivity Studies","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6559933423995972},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.6447682976722717},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5129032135009766},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29138004779815674},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.1851087510585785}],"concepts":[{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6559933423995972},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.6447682976722717},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5129032135009766},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29138004779815674},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.1851087510585785},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3649329.3655982","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3649329.3655982","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 61st ACM/IEEE Design Automation Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2093762675","https://openalex.org/W2725159389","https://openalex.org/W2946794439","https://openalex.org/W3131922516","https://openalex.org/W4214686755"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Attention-based":[0],"models":[1],"provide":[2],"significant":[3],"accuracy":[4,193],"improvement":[5],"to":[6,28,77,85,103,138,159,167,183],"Natural":[7],"Language":[8],"Processing":[9],"(NLP)":[10],"and":[11,22,48,126,156,179,188],"computer":[12],"vision":[13],"(CV)":[14],"fields":[15],"at":[16],"the":[17,30,50,53,64,71,93,118,142,161,165],"cost":[18],"of":[19],"heavy":[20],"computational":[21,162],"memory":[23],"demands.":[24],"Previous":[25],"works":[26],"seek":[27],"alleviate":[29],"performance":[31],"bottleneck":[32],"by":[33,62,130],"removing":[34],"useless":[35],"relations":[36],"for":[37],"each":[38],"position.":[39],"However,":[40],"their":[41,128],"attempts":[42],"only":[43],"focus":[44],"on":[45,120],"intra-sentence":[46],"optimization":[47],"overlook":[49],"opportunity":[51],"in":[52,92,123,135,164],"temporal":[54],"domain.":[55],"In":[56],"this":[57],"paper,":[58],"we":[59,115,145],"accelerate":[60],"attention":[61],"leveraging":[63],"tempo-spatial":[65],"similarity":[66],"across":[67],"successive":[68,74],"sentences,":[69],"given":[70],"observation":[72],"that":[73,114,151,172],"sentences":[75,125,137],"tend":[76],"bear":[78],"high":[79],"similarity.":[80],"This":[81],"is":[82],"rational":[83],"owing":[84],"many":[86],"semantic":[87],"similar":[88,105,121],"words":[89],"(namely":[90],"tokens)":[91],"attention-based":[94],"models.":[95],"We":[96,107],"first":[97],"propose":[98,146],"an":[99],"online-offline":[100],"prediction":[101,154],"algorithm":[102,112,166],"identify":[104],"tokens/heads.":[106],"then":[108],"design":[109],"a":[110,147,153],"recovery":[111,157],"so":[113],"can":[116,174],"skip":[117],"computation":[119],"tokens/heads":[122,133],"succeeding":[124],"recover":[127],"results":[129],"copying":[131],"other":[132],"features":[134],"preceding":[136],"reserve":[139],"accuracy.":[140],"From":[141],"hardware":[143],"aspect,":[144],"specialized":[148],"architecture":[149],"TSAcc":[150,173],"includes":[152],"engine":[155,158],"translate":[160],"saving":[163],"real":[168],"speedup.":[169],"Experiments":[170],"show":[171],"achieve":[175],"8.5X,":[176],"2.7X,":[177],"14.1X,":[178],"64.9X":[180],"speedup":[181],"compared":[182],"SpAtten,":[184],"Sanger,":[185],"1080TI":[186],"GPU,":[187],"Xeon":[189],"CPU,":[190],"with":[191],"negligible":[192],"loss.":[194]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
