{"id":"https://openalex.org/W3162542754","doi":"https://doi.org/10.1109/isqed51717.2021.9424344","title":"Accelerating Transformer-based Deep Learning Models on FPGAs using Column Balanced Block Pruning","display_name":"Accelerating Transformer-based Deep Learning Models on FPGAs using Column Balanced Block Pruning","publication_year":2021,"publication_date":"2021-04-07","ids":{"openalex":"https://openalex.org/W3162542754","doi":"https://doi.org/10.1109/isqed51717.2021.9424344","mag":"3162542754"},"language":"en","primary_location":{"id":"doi:10.1109/isqed51717.2021.9424344","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isqed51717.2021.9424344","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 22nd International Symposium on Quality Electronic Design (ISQED)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045835605","display_name":"Hongwu Peng","orcid":"https://orcid.org/0000-0003-2025-2195"},"institutions":[{"id":"https://openalex.org/I140172145","display_name":"University of Connecticut","ror":"https://ror.org/02der9h97","country_code":"US","type":"education","lineage":["https://openalex.org/I140172145"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hongwu Peng","raw_affiliation_strings":["University of Connecticut, Storrs, CT, USA"],"affiliations":[{"raw_affiliation_string":"University of Connecticut, Storrs, CT, USA","institution_ids":["https://openalex.org/I140172145"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073345631","display_name":"Shaoyi Huang","orcid":"https://orcid.org/0000-0001-6093-9798"},"institutions":[{"id":"https://openalex.org/I140172145","display_name":"University of Connecticut","ror":"https://ror.org/02der9h97","country_code":"US","type":"education","lineage":["https://openalex.org/I140172145"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shaoyi Huang","raw_affiliation_strings":["University of Connecticut, Storrs, CT, USA"],"affiliations":[{"raw_affiliation_string":"University of Connecticut, Storrs, CT, USA","institution_ids":["https://openalex.org/I140172145"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078443672","display_name":"Tong Geng","orcid":"https://orcid.org/0000-0002-3644-2922"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tong Geng","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, WA, USA"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, WA, USA","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100413657","display_name":"Ang Li","orcid":"https://orcid.org/0000-0003-3734-9137"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ang Li","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, WA, USA"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, WA, USA","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019027088","display_name":"Weiwen Jiang","orcid":"https://orcid.org/0000-0002-9004-487X"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Weiwen Jiang","raw_affiliation_strings":["University of Notre Dame, Notre Dame, IN, USA"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame, Notre Dame, IN, USA","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119011911","display_name":"Hang Liu","orcid":"https://orcid.org/0009-0001-2928-1040"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hang Liu","raw_affiliation_strings":["Stevens Institute of Technology, Hoboken, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Stevens Institute of Technology, Hoboken, NJ, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100661401","display_name":"Shusen Wang","orcid":"https://orcid.org/0000-0003-3928-6782"},"institutions":[{"id":"https://openalex.org/I108468826","display_name":"Stevens Institute of Technology","ror":"https://ror.org/02z43xh36","country_code":"US","type":"education","lineage":["https://openalex.org/I108468826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shusen Wang","raw_affiliation_strings":["Stevens Institute of Technology, Hoboken, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Stevens Institute of Technology, Hoboken, NJ, USA","institution_ids":["https://openalex.org/I108468826"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030060072","display_name":"Caiwen Ding","orcid":"https://orcid.org/0000-0003-0891-1231"},"institutions":[{"id":"https://openalex.org/I140172145","display_name":"University of Connecticut","ror":"https://ror.org/02der9h97","country_code":"US","type":"education","lineage":["https://openalex.org/I140172145"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Caiwen Ding","raw_affiliation_strings":["University of Connecticut, Storrs, CT, USA"],"affiliations":[{"raw_affiliation_string":"University of Connecticut, Storrs, CT, USA","institution_ids":["https://openalex.org/I140172145"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5045835605"],"corresponding_institution_ids":["https://openalex.org/I140172145"],"apc_list":null,"apc_paid":null,"fwci":7.8952,"has_fulltext":false,"cited_by_count":102,"citation_normalized_percentile":{"value":0.98140984,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"142","last_page":"148"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.71393883228302},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6814488172531128},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5486269593238831},{"id":"https://openalex.org/keywords/gate-array","display_name":"Gate array","score":0.4875001609325409},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.48286134004592896},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.41985398530960083},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3239253759384155},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.304178923368454},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12056678533554077},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.0786983072757721}],"concepts":[{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.71393883228302},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6814488172531128},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5486269593238831},{"id":"https://openalex.org/C114237110","wikidata":"https://www.wikidata.org/wiki/Q114901","display_name":"Gate array","level":3,"score":0.4875001609325409},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.48286134004592896},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.41985398530960083},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3239253759384155},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.304178923368454},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12056678533554077},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0786983072757721},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isqed51717.2021.9424344","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isqed51717.2021.9424344","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 22nd International Symposium on Quality Electronic Design (ISQED)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W2064675550","https://openalex.org/W2119144962","https://openalex.org/W2177436562","https://openalex.org/W2527036487","https://openalex.org/W2585720638","https://openalex.org/W2588448445","https://openalex.org/W2798170643","https://openalex.org/W2803374624","https://openalex.org/W2896457183","https://openalex.org/W2899244816","https://openalex.org/W2915106038","https://openalex.org/W2962820060","https://openalex.org/W2963000224","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W2963494889","https://openalex.org/W2964033223","https://openalex.org/W2964199361","https://openalex.org/W2964299589","https://openalex.org/W2965373594","https://openalex.org/W2978017171","https://openalex.org/W2998342322","https://openalex.org/W3035038672","https://openalex.org/W3037115325","https://openalex.org/W3047848469","https://openalex.org/W3094502228","https://openalex.org/W3096609285","https://openalex.org/W3104216863","https://openalex.org/W3132616766","https://openalex.org/W4298422451","https://openalex.org/W4299809807","https://openalex.org/W4385245566","https://openalex.org/W6677580257","https://openalex.org/W6685823913","https://openalex.org/W6725543821","https://openalex.org/W6727099177","https://openalex.org/W6739901393","https://openalex.org/W6750209611","https://openalex.org/W6755207826","https://openalex.org/W6766673545","https://openalex.org/W6768851824","https://openalex.org/W6776676620","https://openalex.org/W6780302750","https://openalex.org/W6782869744","https://openalex.org/W6784333009","https://openalex.org/W6785708172"],"related_works":["https://openalex.org/W4206178588","https://openalex.org/W4287635093","https://openalex.org/W3094491777","https://openalex.org/W3214715529","https://openalex.org/W2014165129","https://openalex.org/W2367348190","https://openalex.org/W594316872","https://openalex.org/W2831860248","https://openalex.org/W2367794224","https://openalex.org/W2072850836"],"abstract_inverted_index":{"Although":[0],"Transformer-based":[1],"language":[2,10],"representations":[3],"achieve":[4],"state-of-the-art":[5],"accuracy":[6],"on":[7,48,57,72,104],"various":[8],"natural":[9],"processing":[11],"(NLP)":[12],"tasks,":[13],"the":[14,21,36,43,51,67,82,89,97,101,111],"large":[15],"model":[16,91],"size":[17,113],"has":[18,45],"been":[19,46],"challenging":[20],"resource":[22],"constrained":[23],"computing":[24],"platforms.":[25],"Weight":[26],"pruning,":[27],"as":[28],"a":[29],"popular":[30],"and":[31,41,74,96,126],"effective":[32],"technique":[33],"in":[34],"reducing":[35],"number":[37],"of":[38,114],"weight":[39,55],"parameters":[40],"accelerating":[42],"Transformer,":[44],"investigated":[47],"GPUs.":[49],"However,":[50],"Transformer":[52,73,90,102],"acceleration":[53,78],"using":[54],"pruning":[56,71],"field-programmable":[58],"gate":[59],"array":[60],"(FPGAs)":[61],"remains":[62],"unexplored.":[63],"This":[64],"paper":[65],"investigates":[66],"column":[68],"balanced":[69,83],"block-wise":[70],"designs":[75],"an":[76],"FPGA":[77,105],"engine":[79],"to":[80,123,132],"customize":[81],"blockwise":[84],"matrix":[85],"multiplication.":[86],"We":[87],"implement":[88],"with":[92,110],"proper":[93],"hardware":[94],"scheduling,":[95],"experiments":[98],"show":[99],"that":[100],"inference":[103],"achieves":[106],"10.35":[107],"ms":[108],"latency":[109],"batch":[112],"32,":[115],"which":[116],"is":[117],"10.96":[118],"*":[119,128],"speed":[120,129],"up":[121,130],"comparing":[122,131],"CPU":[124],"platform":[125],"2.08":[127],"GPU":[133],"platform.":[134]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":21},{"year":2024,"cited_by_count":30},{"year":2023,"cited_by_count":25},{"year":2022,"cited_by_count":19},{"year":2021,"cited_by_count":4}],"updated_date":"2026-03-31T07:56:22.981413","created_date":"2025-10-10T00:00:00"}
