{"id":"https://openalex.org/W4408563999","doi":"https://doi.org/10.1109/tcsi.2025.3549060","title":"Topkima-Former: Low-Energy, Low-Latency Inference for Transformers Using Top- <i>k</i> In-Memory ADC","display_name":"Topkima-Former: Low-Energy, Low-Latency Inference for Transformers Using Top- <i>k</i> In-Memory ADC","publication_year":2025,"publication_date":"2025-03-18","ids":{"openalex":"https://openalex.org/W4408563999","doi":"https://doi.org/10.1109/tcsi.2025.3549060"},"language":"en","primary_location":{"id":"doi:10.1109/tcsi.2025.3549060","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2025.3549060","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Shuai Dong","orcid":"https://orcid.org/0009-0007-4807-5094"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Shuai Dong","raw_affiliation_strings":["Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong"],"raw_orcid":"https://orcid.org/0009-0007-4807-5094","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001439194","display_name":"Junyi Yang","orcid":"https://orcid.org/0000-0002-5867-4943"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Junyi Yang","raw_affiliation_strings":["Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong"],"raw_orcid":"https://orcid.org/0000-0002-5867-4943","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102547113","display_name":"Xiaoqi Peng","orcid":"https://orcid.org/0009-0005-7716-5318"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Xiaoqi Peng","raw_affiliation_strings":["Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong"],"raw_orcid":"https://orcid.org/0009-0005-7716-5318","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109797096","display_name":"H. Shang","orcid":"https://orcid.org/0009-0007-6276-1947"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Hongyang Shang","raw_affiliation_strings":["Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong"],"raw_orcid":"https://orcid.org/0009-0007-6276-1947","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104284748","display_name":"Ye Ke","orcid":"https://orcid.org/0009-0002-9809-1192"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Ye Ke","raw_affiliation_strings":["Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong"],"raw_orcid":"https://orcid.org/0009-0002-9809-1192","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063285225","display_name":"Xiaofeng Yang","orcid":"https://orcid.org/0000-0003-1400-7994"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiaofeng Yang","raw_affiliation_strings":["Reexen Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-1400-7994","affiliations":[{"raw_affiliation_string":"Reexen Technology, Shenzhen, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010273308","display_name":"H. Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongjie Liu","raw_affiliation_strings":["Reexen Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0005-0904-5736","affiliations":[{"raw_affiliation_string":"Reexen Technology, Shenzhen, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002380437","display_name":"Arindam Basu","orcid":"https://orcid.org/0000-0003-1035-8770"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Arindam Basu","raw_affiliation_strings":["Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong"],"raw_orcid":"https://orcid.org/0000-0003-1035-8770","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"Department of Electrical Engineering, City University of Hong Kong, Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.5825,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.89083417,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"72","issue":"6","first_page":"2509","last_page":"2519"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10472","display_name":"Semiconductor materials and devices","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5513524413108826},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5100651383399963},{"id":"https://openalex.org/keywords/successive-approximation-adc","display_name":"Successive approximation ADC","score":0.48008662462234497},{"id":"https://openalex.org/keywords/electronic-engineering","display_name":"Electronic engineering","score":0.4511508047580719},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.34638431668281555},{"id":"https://openalex.org/keywords/capacitor","display_name":"Capacitor","score":0.24647632241249084},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.20862668752670288},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.19944453239440918}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5513524413108826},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5100651383399963},{"id":"https://openalex.org/C60154766","wikidata":"https://www.wikidata.org/wiki/Q2650458","display_name":"Successive approximation ADC","level":4,"score":0.48008662462234497},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.4511508047580719},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.34638431668281555},{"id":"https://openalex.org/C52192207","wikidata":"https://www.wikidata.org/wiki/Q5322","display_name":"Capacitor","level":3,"score":0.24647632241249084},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.20862668752670288},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.19944453239440918}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsi.2025.3549060","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2025.3549060","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8299999833106995,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W206948248","https://openalex.org/W2020003503","https://openalex.org/W2042519306","https://openalex.org/W2114833655","https://openalex.org/W2167148127","https://openalex.org/W2906917284","https://openalex.org/W2946480111","https://openalex.org/W2963899139","https://openalex.org/W2964176059","https://openalex.org/W3017968097","https://openalex.org/W3044192339","https://openalex.org/W3094502228","https://openalex.org/W3112740243","https://openalex.org/W3115909741","https://openalex.org/W3139521791","https://openalex.org/W3159727696","https://openalex.org/W3189877953","https://openalex.org/W3211525823","https://openalex.org/W4205141919","https://openalex.org/W4214833843","https://openalex.org/W4226402784","https://openalex.org/W4281874271","https://openalex.org/W4293023328","https://openalex.org/W4293768835","https://openalex.org/W4312847929","https://openalex.org/W4360832001","https://openalex.org/W4378801105","https://openalex.org/W4381233128","https://openalex.org/W4387042316","https://openalex.org/W4389166707","https://openalex.org/W4389459141","https://openalex.org/W4390017976","https://openalex.org/W4400726540","https://openalex.org/W4405267264","https://openalex.org/W6691766336","https://openalex.org/W6755207826","https://openalex.org/W6788001715","https://openalex.org/W6810643285"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2864363823"],"abstract_inverted_index":{"Transformer":[0],"has":[1],"emerged":[2],"as":[3,138],"a":[4,26,104,120,149,201,206],"leading":[5],"architecture":[6,50,145],"in":[7,251],"neural":[8],"language":[9],"processing":[10],"(NLP)":[11],"and":[12,32,49,157,181,205,228,254],"computer":[13],"vision":[14,253],"(CV).":[15],"However,":[16],"the":[17,38,46,54,57,81,94,101,115,127,144],"extensive":[18],"use":[19],"of":[20,37,98],"nonlinear":[21],"operations,":[22],"like":[23],"softmax,":[24],"poses":[25],"performance":[27],"bottleneck":[28],"during":[29,114],"transformer":[30],"inference":[31],"comprises":[33],"up":[34],"to":[35,52,72,89,125,200,244],"40%":[36],"total":[39],"latency.":[40],"Hence,":[41],"we":[42,60,147],"propose":[43,61],"innovations":[44],"at":[45],"circuit,":[47],"algorithm":[48],"levels":[51],"accelerate":[53],"transformer.":[55],"At":[56,100,143],"circuit":[58],"level,":[59,103,146],"Topkima\u2014combining":[62],"top-<italic":[63,109,140,208],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[64,83,110,122,135,141,173,183,209,222,230],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">k</i>":[65,84,111,123,136,210],"activation":[66],"selection":[67],"with":[68,119],"in-memory":[69],"ADC":[70],"(IMA)":[71],"implement":[73],"efficient":[74],"softmax":[75,90,203,212,217],"without":[76],"any":[77],"sorting":[78],"overhead.":[79],"Only":[80],"<italic":[82],"largest":[85],"activations":[86,112],"are":[87],"sent":[88],"calculation":[91],"block,":[92],"reducing":[93],"huge":[95],"computational":[96],"cost":[97],"softmax.":[99],"algorithmic":[102],"modified":[105],"training":[106],"scheme":[107],"utilizes":[108],"only":[113],"forward":[116],"pass,":[117],"combined":[118,167],"sub-top-<italic":[121,134],"method":[124],"address":[126],"crossbar":[128],"size":[129],"limitation":[130],"by":[131],"aggregating":[132],"each":[133],"values":[137],"global":[139],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">k</i>.":[142],"introduce":[148],"fine":[150],"pipeline":[151],"for":[152,162,248],"efficiently":[153],"scheduling":[154],"data":[155],"flows":[156],"an":[158],"improved":[159],"scale-free":[160],"technique":[161],"removing":[163],"scaling":[164],"cost.":[165],"The":[166],"system,":[168],"dubbed":[169],"Topkima-Former,":[170],"enhances":[171],"<inline-formula":[172,182,221,229],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[174,184,223,231],"<tex-math":[175,185,224,232],"notation=\"LaTeX\">$1.8\\times":[176],"-84\\times":[177],"$":[178,188,226,234],"</tex-math></inline-formula>":[179,189,227,235],"speedup":[180],"notation=\"LaTeX\">$1.2\\times":[186],"-36\\times":[187],"energy":[190],"efficiency":[191],"(EE)":[192],"over":[193],"prior":[194],"In-memory":[195],"computing":[196],"(IMC)":[197],"accelerators.":[198],"Compared":[199],"conventional":[202],"macro":[204,218],"digital":[207],"(Dtopk)":[211],"macro,":[213],"our":[214],"proposed":[215],"Topkima":[216],"achieves":[219],"about":[220],"notation=\"LaTeX\">$15\\times":[225],"notation=\"LaTeX\">$8\\times":[233],"faster":[236],"speed":[237],"respectively.":[238],"Experimental":[239],"evaluations":[240],"demonstrate":[241],"minimal":[242],"(0.42%":[243],"1.60%)":[245],"accuracy":[246],"loss":[247],"different":[249],"models":[250],"both":[252],"NLP":[255],"tasks.":[256]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":2}],"updated_date":"2026-06-19T17:40:00.097472","created_date":"2025-03-19T00:00:00"}
