{"id":"https://openalex.org/W4401211356","doi":"https://doi.org/10.1109/tbcas.2024.3436837","title":"High-Performance Method and Architecture for Attention Computation in DNN Inference","display_name":"High-Performance Method and Architecture for Attention Computation in DNN Inference","publication_year":2024,"publication_date":"2024-08-01","ids":{"openalex":"https://openalex.org/W4401211356","doi":"https://doi.org/10.1109/tbcas.2024.3436837","pmid":"https://pubmed.ncbi.nlm.nih.gov/39088504"},"language":"en","primary_location":{"id":"doi:10.1109/tbcas.2024.3436837","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbcas.2024.3436837","pdf_url":null,"source":{"id":"https://openalex.org/S80299757","display_name":"IEEE Transactions on Biomedical Circuits and Systems","issn_l":"1932-4545","issn":["1932-4545","1940-9990"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Biomedical Circuits and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Qi Cheng","orcid":"https://orcid.org/0009-0001-6045-8959"},"institutions":[{"id":"https://openalex.org/I142108993","display_name":"Southwest University","ror":"https://ror.org/01kj4z117","country_code":"CN","type":"education","lineage":["https://openalex.org/I142108993"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qi Cheng","raw_affiliation_strings":["College of Artificial Intelligence, Southwest University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Southwest University, Chongqing, China","institution_ids":["https://openalex.org/I142108993"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087454088","display_name":"Xiaofang Hu","orcid":"https://orcid.org/0000-0003-3764-2640"},"institutions":[{"id":"https://openalex.org/I142108993","display_name":"Southwest University","ror":"https://ror.org/01kj4z117","country_code":"CN","type":"education","lineage":["https://openalex.org/I142108993"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaofang Hu","raw_affiliation_strings":["College of Artificial Intelligence, Southwest University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Southwest University, Chongqing, China","institution_ids":["https://openalex.org/I142108993"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100719067","display_name":"He Xiao","orcid":"https://orcid.org/0000-0003-0769-0780"},"institutions":[{"id":"https://openalex.org/I142108993","display_name":"Southwest University","ror":"https://ror.org/01kj4z117","country_code":"CN","type":"education","lineage":["https://openalex.org/I142108993"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"He Xiao","raw_affiliation_strings":["College of Artificial Intelligence, Southwest University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Southwest University, Chongqing, China","institution_ids":["https://openalex.org/I142108993"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034322739","display_name":"Yue Zhou","orcid":"https://orcid.org/0009-0006-9839-2947"},"institutions":[{"id":"https://openalex.org/I142108993","display_name":"Southwest University","ror":"https://ror.org/01kj4z117","country_code":"CN","type":"education","lineage":["https://openalex.org/I142108993"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Zhou","raw_affiliation_strings":["College of Artificial Intelligence, Southwest University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Southwest University, Chongqing, China","institution_ids":["https://openalex.org/I142108993"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035048973","display_name":"Shukai Duan","orcid":"https://orcid.org/0000-0002-0040-3796"},"institutions":[{"id":"https://openalex.org/I142108993","display_name":"Southwest University","ror":"https://ror.org/01kj4z117","country_code":"CN","type":"education","lineage":["https://openalex.org/I142108993"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shukai Duan","raw_affiliation_strings":["College of Artificial Intelligence, Southwest University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, Southwest University, Chongqing, China","institution_ids":["https://openalex.org/I142108993"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I142108993"],"apc_list":null,"apc_paid":null,"fwci":0.2378,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.54707446,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"19","issue":"2","first_page":"404","last_page":"415"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9775999784469604,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9775999784469604,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9230999946594238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9010999798774719,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6890167593955994},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.668120265007019},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6394537687301636},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5947871208190918},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48180192708969116},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.47148749232292175},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.19482189416885376}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6890167593955994},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.668120265007019},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6394537687301636},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5947871208190918},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48180192708969116},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.47148749232292175},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.19482189416885376},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tbcas.2024.3436837","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbcas.2024.3436837","pdf_url":null,"source":{"id":"https://openalex.org/S80299757","display_name":"IEEE Transactions on Biomedical Circuits and Systems","issn_l":"1932-4545","issn":["1932-4545","1940-9990"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Biomedical Circuits and Systems","raw_type":"journal-article"},{"id":"pmid:39088504","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/39088504","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on biomedical circuits and systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2152130785","display_name":null,"funder_award_id":"61976246","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2816725917","display_name":null,"funder_award_id":"CSTB2023NSCQ-MSX0018","funder_id":"https://openalex.org/F4320323172","funder_display_name":"Natural Science Foundation of Chongqing"},{"id":"https://openalex.org/G5602616428","display_name":null,"funder_award_id":"SWU-KR22046","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G571593048","display_name":null,"funder_award_id":"U20A20227","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323172","display_name":"Natural Science Foundation of Chongqing","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W1542981317","https://openalex.org/W2005490094","https://openalex.org/W2082450466","https://openalex.org/W2108505641","https://openalex.org/W2112181056","https://openalex.org/W2154852616","https://openalex.org/W2937064326","https://openalex.org/W2974644665","https://openalex.org/W2982974103","https://openalex.org/W3015729306","https://openalex.org/W3047040508","https://openalex.org/W3174407341","https://openalex.org/W3207846280","https://openalex.org/W4205363571","https://openalex.org/W4206262671","https://openalex.org/W4226030837","https://openalex.org/W4255455317","https://openalex.org/W4286001027","https://openalex.org/W4293768835","https://openalex.org/W4312771985","https://openalex.org/W4316661158","https://openalex.org/W4321479797","https://openalex.org/W4362592573","https://openalex.org/W4367728425","https://openalex.org/W4377001511","https://openalex.org/W4378364815","https://openalex.org/W4379116086","https://openalex.org/W4382677757","https://openalex.org/W4385245566","https://openalex.org/W4385267257","https://openalex.org/W4385300578","https://openalex.org/W4385617056","https://openalex.org/W4386710216","https://openalex.org/W4388979504","https://openalex.org/W4390033950","https://openalex.org/W4390575692","https://openalex.org/W4390575695","https://openalex.org/W4391092774","https://openalex.org/W4391407189","https://openalex.org/W4391768379","https://openalex.org/W4391952650","https://openalex.org/W4392823494","https://openalex.org/W4393033212","https://openalex.org/W4393095888","https://openalex.org/W4394566113","https://openalex.org/W4394596865","https://openalex.org/W4395668837","https://openalex.org/W4399304422","https://openalex.org/W4403210910","https://openalex.org/W6649256720","https://openalex.org/W6853667026"],"related_works":["https://openalex.org/W2055243143","https://openalex.org/W4231775656","https://openalex.org/W2046435967","https://openalex.org/W2383646825","https://openalex.org/W2371018915","https://openalex.org/W2354191502","https://openalex.org/W1972225038","https://openalex.org/W4321636575","https://openalex.org/W3134658850","https://openalex.org/W2038503502"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"The":[3],"combination":[4],"of":[5,15,20,67,97,111,115,150],"Attention":[6,55,68,82,141,167],"mechanism":[7],"and":[8,40,71,77,133,173,183,185],"deep":[9,151],"learning":[10],"has":[11],"a":[12,48],"wide":[13],"range":[14],"applications":[16],"in":[17,69,105],"the":[18,65,81,95,101,109,112,116,131,139,148,159,165,170],"field":[19],"medical":[21],"imaging.":[22],"However,":[23],"due":[24],"to":[25,44,93,107,124],"its":[26,98],"complex":[27],"computational":[28],"processes,":[29],"existing":[30],"hardware":[31,56,70,102,142,168],"architectures":[32],"have":[33],"high":[34],"resource":[35],"consumption":[36],"or":[37],"low":[38],"accuracy,":[39],"deploying":[41],"them":[42],"efficiently":[43],"DNN":[45],"accelerators":[46],"is":[47,85,122,136],"challenge.":[49],"This":[50],"paper":[51],"proposes":[52],"an":[53,118],"online-programmable":[54,119],"architecture":[57,121,143],"based":[58],"on":[59,100,158],"compute-in-memory":[60],"(CIM)":[61],"marco,":[62],"which":[63],"reduces":[64],"complexity":[66,96],"improves":[72],"integration":[73],"density,":[74],"energy":[75,174],"efficiency,":[76],"calculation":[78,126],"accuracy.":[79],"First,":[80],"computation":[83],"process":[84],"decomposed":[86],"into":[87],"multiple":[88],"cascaded":[89],"combinatorial":[90],"matrix":[91],"operations":[92],"reduce":[94,108],"implementation":[99],"side;":[103],"second,":[104],"order":[106],"influence":[110],"non-ideal":[113],"characteristics":[114],"hardware,":[117],"CIM":[120],"designed":[123],"improve":[125],"accuracy":[127],"by":[128,178,190],"dynamically":[129],"adjusting":[130],"weights;":[132],"lastly,":[134],"it":[135],"verified":[137],"that":[138],"proposed":[140],"can":[144],"be":[145],"applied":[146],"for":[147],"inference":[149],"neural":[152],"networks":[153],"through":[154],"Spice":[155],"simulation.":[156],"Based":[157],"100nm":[160],"CMOS":[161],"process,":[162],"compared":[163],"with":[164],"traditional":[166],"architectures,":[169],"integrated":[171],"density":[172],"efficiency":[175,187],"are":[176,188],"increased":[177],"at":[179],"least":[180],"91.38":[181],"times,":[182],"latency":[184],"computing":[186],"improved":[189],"about":[191],"12.5":[192],"times.":[193]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-18T07:56:08.524223","created_date":"2025-10-10T00:00:00"}
