{"id":"https://openalex.org/W4407720853","doi":"https://doi.org/10.1109/iceic64972.2025.10879696","title":"MOSA: Matrix Optimized Self-Attention Hardware Accelerator for Mobile Device","display_name":"MOSA: Matrix Optimized Self-Attention Hardware Accelerator for Mobile Device","publication_year":2025,"publication_date":"2025-01-19","ids":{"openalex":"https://openalex.org/W4407720853","doi":"https://doi.org/10.1109/iceic64972.2025.10879696"},"language":"en","primary_location":{"id":"doi:10.1109/iceic64972.2025.10879696","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iceic64972.2025.10879696","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Electronics, Information, and Communication (ICEIC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059080461","display_name":"Y.C. Chang","orcid":null},"institutions":[{"id":"https://openalex.org/I107470533","display_name":"Tamkang University","ror":"https://ror.org/04tft4718","country_code":"TW","type":"education","lineage":["https://openalex.org/I107470533"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Yang-Rwei Chang","raw_affiliation_strings":["Tamkang University,Dept. Electrical and Computer Engineering,New Taipei City,Taiwan R.O.C"],"affiliations":[{"raw_affiliation_string":"Tamkang University,Dept. Electrical and Computer Engineering,New Taipei City,Taiwan R.O.C","institution_ids":["https://openalex.org/I107470533"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hsuan-Fu Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I107470533","display_name":"Tamkang University","ror":"https://ror.org/04tft4718","country_code":"TW","type":"education","lineage":["https://openalex.org/I107470533"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Hsuan-Fu Chen","raw_affiliation_strings":["Tamkang University,Dept. Electrical and Computer Engineering,New Taipei City,Taiwan R.O.C"],"affiliations":[{"raw_affiliation_string":"Tamkang University,Dept. Electrical and Computer Engineering,New Taipei City,Taiwan R.O.C","institution_ids":["https://openalex.org/I107470533"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084451408","display_name":"Horng-Yuan Shih","orcid":"https://orcid.org/0000-0002-0802-9436"},"institutions":[{"id":"https://openalex.org/I107470533","display_name":"Tamkang University","ror":"https://ror.org/04tft4718","country_code":"TW","type":"education","lineage":["https://openalex.org/I107470533"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Horng-Yuan Shih","raw_affiliation_strings":["Tamkang University,Dept. Electrical and Computer Engineering,New Taipei City,Taiwan R.O.C"],"affiliations":[{"raw_affiliation_string":"Tamkang University,Dept. Electrical and Computer Engineering,New Taipei City,Taiwan R.O.C","institution_ids":["https://openalex.org/I107470533"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5059080461"],"corresponding_institution_ids":["https://openalex.org/I107470533"],"apc_list":null,"apc_paid":null,"fwci":2.1376,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.81128966,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9351000189781189,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9351000189781189,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7084968686103821},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.5976649522781372},{"id":"https://openalex.org/keywords/mobile-device","display_name":"Mobile device","score":0.5077698826789856},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.4498141407966614},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.356046199798584},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.23703065514564514},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.23342043161392212}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7084968686103821},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.5976649522781372},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.5077698826789856},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.4498141407966614},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.356046199798584},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.23703065514564514},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.23342043161392212}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iceic64972.2025.10879696","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iceic64972.2025.10879696","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Electronics, Information, and Communication (ICEIC)","raw_type":"proceedings-article"},{"id":"pmh:oai:tkuir.lib.tku.edu.tw:987654321/128112","is_oa":false,"landing_page_url":"https://tkuir.lib.tku.edu.tw/dspace/handle/987654321/128112","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":2,"referenced_works":["https://openalex.org/W2289252105","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W3152699334","https://openalex.org/W2127760637","https://openalex.org/W2390254310"],"abstract_inverted_index":{"The":[0],"Self-Attention":[1,85],"mechanism,":[2],"which":[3,128],"lies":[4],"at":[5],"the":[6,54,95,99,111,153,156,171],"core":[7],"of":[8,56],"Transformer":[9],"architectures,":[10],"plays":[11],"a":[12,84],"vital":[13],"role":[14],"in":[15,50],"capturing":[16],"long-range":[17],"dependencies.":[18],"However,":[19],"its":[20],"high":[21],"computational":[22,113,149,165],"complexity":[23],"and":[24,43,67,105,125,178,206],"significant":[25],"memory":[26,41,69,106,123,131],"requirements":[27],"pose":[28],"major":[29],"challenges":[30],"for":[31,60,73,90,158],"resource-constrained":[32],"hardware":[33,58,86,191],"such":[34,202],"as":[35,203],"mobile":[36,79,91,193],"devices.":[37,80,92],"In":[38,151],"particular,":[39],"frequent":[40,122],"accesses":[42],"inefficient":[44],"matrix":[45,65,96],"multiplication":[46,97],"operations":[47,66],"often":[48],"result":[49],"performance":[51],"bottlenecks.":[52],"Therefore,":[53],"development":[55],"dedicated":[57],"accelerators":[59],"Self-Attention,":[61],"focusing":[62],"on":[63,78,142],"optimizing":[64,94],"reducing":[68],"usage,":[70],"is":[71,174],"essential":[72],"improving":[74],"AI":[75],"processing":[76,205],"efficiency":[77],"This":[81,134],"paper":[82],"presents":[83],"accelerator":[87,100,154],"designed":[88],"specifically":[89],"By":[93],"process,":[98],"effectively":[101],"reduces":[102,130],"data":[103,135],"transmission":[104,181],"access":[107],"frequency,":[108],"thereby":[109],"lowering":[110],"overall":[112],"complexity.":[114],"It":[115],"also":[116,146],"reuses":[117],"intermediate":[118],"computation":[119],"results,":[120],"minimizing":[121],"read":[124],"write":[126],"operations,":[127,161],"significantly":[129],"bandwidth":[132],"requirements.":[133],"reuse":[136],"strategy":[137],"not":[138],"only":[139],"cuts":[140],"down":[141],"redundant":[143],"computations":[144],"but":[145],"greatly":[147],"enhances":[148],"efficiency.":[150],"addition,":[152],"eliminates":[155],"need":[157],"Key":[159],"Transpose":[160],"further":[162],"simplifying":[163],"certain":[164],"steps.":[166],"Compared":[167],"to":[168],"traditional":[169],"algorithms,":[170],"idle":[172],"time":[173],"reduced":[175,184],"by":[176,185],"66.5%.,":[177],"signal":[179],"line":[180],"costs":[182],"are":[183],"approximately":[186],"80%.":[187],"With":[188],"an":[189],"optimized":[190],"architecture,":[192],"devices":[194],"can":[195],"efficiently":[196],"support":[197],"complex":[198],"deep":[199],"learning":[200],"applications,":[201],"speech":[204],"image":[207],"recognition.":[208]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
