{"id":"https://openalex.org/W4400726540","doi":"https://doi.org/10.1109/tcsi.2024.3426653","title":"BSViT: A Bit-Serial Vision Transformer Accelerator Exploiting Dynamic Patch and Weight Bit-Group Quantization","display_name":"BSViT: A Bit-Serial Vision Transformer Accelerator Exploiting Dynamic Patch and Weight Bit-Group Quantization","publication_year":2024,"publication_date":"2024-07-17","ids":{"openalex":"https://openalex.org/W4400726540","doi":"https://doi.org/10.1109/tcsi.2024.3426653"},"language":"en","primary_location":{"id":"doi:10.1109/tcsi.2024.3426653","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2024.3426653","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006070507","display_name":"Gang Wang","orcid":"https://orcid.org/0009-0003-6944-2958"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Gang Wang","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103263156","display_name":"Siqi Cai","orcid":"https://orcid.org/0000-0003-1478-2202"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siqi Cai","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100408977","display_name":"Wenjie Li","orcid":"https://orcid.org/0000-0002-1244-7657"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenjie Li","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066692868","display_name":"Dongxu Lyu","orcid":"https://orcid.org/0000-0001-6826-2670"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongxu Lyu","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054897331","display_name":"Guanghui He","orcid":"https://orcid.org/0000-0002-0486-6421"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanghui He","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering and the MoE Key Laboratory of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering and the MoE Key Laboratory of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5006070507"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":2.8877,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.91288474,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"71","issue":"9","first_page":"4064","last_page":"4077"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5541137456893921},{"id":"https://openalex.org/keywords/bit","display_name":"Bit (key)","score":0.553321897983551},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.512313961982727},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.48428934812545776},{"id":"https://openalex.org/keywords/electronic-engineering","display_name":"Electronic engineering","score":0.4163815379142761},{"id":"https://openalex.org/keywords/8-bit","display_name":"8-bit","score":0.41494816541671753},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.2988339960575104},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.29517874121665955},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.20478194952011108},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.18002471327781677},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.11661338806152344}],"concepts":[{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5541137456893921},{"id":"https://openalex.org/C117011727","wikidata":"https://www.wikidata.org/wiki/Q1278488","display_name":"Bit (key)","level":2,"score":0.553321897983551},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.512313961982727},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.48428934812545776},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.4163815379142761},{"id":"https://openalex.org/C187919765","wikidata":"https://www.wikidata.org/wiki/Q270159","display_name":"8-bit","level":2,"score":0.41494816541671753},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.2988339960575104},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.29517874121665955},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.20478194952011108},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.18002471327781677},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.11661338806152344},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsi.2024.3426653","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2024.3426653","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5739802379","display_name":null,"funder_award_id":"62074097","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W3043504674","https://openalex.org/W3138516171","https://openalex.org/W4210396250","https://openalex.org/W4220865834","https://openalex.org/W4285507310","https://openalex.org/W4285601701","https://openalex.org/W4287118909","https://openalex.org/W4307934016","https://openalex.org/W4308479898","https://openalex.org/W4319996342","https://openalex.org/W4360831786","https://openalex.org/W4360831795","https://openalex.org/W4362500802","https://openalex.org/W4380881077","https://openalex.org/W4385216221","https://openalex.org/W4385216645","https://openalex.org/W4385245566","https://openalex.org/W4386306971","https://openalex.org/W4386765191","https://openalex.org/W4387042316","https://openalex.org/W4387789586","https://openalex.org/W4387789741","https://openalex.org/W4389166707","https://openalex.org/W4390190626","https://openalex.org/W4390356856","https://openalex.org/W4390873673","https://openalex.org/W4390874575","https://openalex.org/W4393406875","https://openalex.org/W6729126992","https://openalex.org/W6763456558","https://openalex.org/W6788135285","https://openalex.org/W6791353385","https://openalex.org/W6796815506","https://openalex.org/W6840088539","https://openalex.org/W6846164622"],"related_works":["https://openalex.org/W3149091528","https://openalex.org/W2028353274","https://openalex.org/W975020229","https://openalex.org/W2121145321","https://openalex.org/W1902169700","https://openalex.org/W2257409576","https://openalex.org/W2502671172","https://openalex.org/W2921226914","https://openalex.org/W3143808432","https://openalex.org/W2996053819"],"abstract_inverted_index":{"Vision":[0,45,60],"Transformers":[1],"(ViTs)":[2],"have":[3],"achieved":[4],"remarkable":[5],"success":[6],"in":[7],"computer":[8],"vision":[9],"(CV)":[10],"and":[11,58,76,105,127,149,154,166,204,220],"are":[12],"increasingly":[13],"recognized":[14],"as":[15],"the":[16,26,64,136,160,182],"new":[17],"backbone":[18],"for":[19],"vision-language":[20],"multi-modal":[21],"tasks.":[22],"Despite":[23],"their":[24,34,99],"success,":[25],"high":[27],"computational":[28],"cost":[29],"associated":[30],"with":[31],"ViTs":[32],"hinders":[33],"inference":[35],"efficiency.":[36],"In":[37],"this":[38],"paper,":[39],"we":[40,67,113,139],"introduce":[41,82,152],"BSViT,":[42],"a":[43,69,83,115,141],"bit-serial":[44,143,156,218],"Transformer":[46,61,236],"accelerator":[47,144],"enhanced":[48],"by":[49],"algorithm-hardware":[50],"co-design.":[51],"BSViT":[52,191],"can":[53,192],"efficiently":[54,146,180],"accelerate":[55],"both":[56],"plain":[57],"hierarchical":[59],"inference.":[62],"At":[63,135],"algorithm":[65],"level,":[66,138],"propose":[68,114,140],"post-training":[70],"quantization":[71,86,118],"scheme":[72,88,120],"named":[73],"dynamic":[74,84],"patch":[75,85],"weight":[77,116],"bit-group":[78,117],"quantization.":[79],"We":[80,151],"first":[81],"(DPQ)":[87],"to":[89,93,121,145,158,179,195,215,223,234],"dynamically":[90],"allocate":[91],"bit-width":[92],"different":[94],"image":[95],"patches":[96],"based":[97],"on":[98],"importance,":[100],"thus":[101],"reducing":[102],"bit":[103],"width":[104],"saving":[106],"computation":[107],"without":[108],"significantly":[109],"impacting":[110],"accuracy.":[111],"Second,":[112],"(BGQ)":[119],"evenly":[122],"distribute":[123],"bits":[124],"within":[125],"groups":[126],"achieve":[128,193,221],"workload":[129],"balance":[130,181],"across":[131],"processing":[132],"elements":[133],"(PEs).":[134],"hardware":[137],"term-separate":[142],"support":[147],"DPQ":[148],"BGQ.":[150],"dense":[153,161],"sparse":[155,167],"PEs":[157],"manipulate":[159],"least":[162],"significant":[163,169],"term":[164,170],"(LST)":[165],"most":[168],"(MST)":[171],"workloads.":[172,186],"A":[173],"dense-sparse":[174],"hybrid":[175],"dataflow":[176],"is":[177],"devised":[178],"two":[183],"kinds":[184],"of":[185],"Our":[187],"experiments":[188],"show":[189],"that":[190],"up":[194,222],"<inline-formula":[196,205,224],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[197,206,225],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[198,207,226],"<tex-math":[199,208,227],"notation=\"LaTeX\">$1.95\\times":[200],"$":[201,210,229],"</tex-math></inline-formula>":[202,211,230],"speedup":[203],"notation=\"LaTeX\">$2.72\\times":[209],"energy":[212,231],"efficiency":[213,232],"compared":[214,233],"state-of-the-art":[216],"(SOTA)":[217],"accelerators":[219],"notation=\"LaTeX\">$3.69\\times":[228],"SOTA":[235],"accelerators.":[237]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":12}],"updated_date":"2026-02-25T23:00:34.991745","created_date":"2025-10-10T00:00:00"}
