{"id":"https://openalex.org/W4404688000","doi":"https://doi.org/10.1109/tvlsi.2024.3488782","title":"MASL-AFU: A High Memory Access Efficiency 2-D Scalable LUT-Based Activation Function Unit for On-Device DNN Training","display_name":"MASL-AFU: A High Memory Access Efficiency 2-D Scalable LUT-Based Activation Function Unit for On-Device DNN Training","publication_year":2024,"publication_date":"2024-11-25","ids":{"openalex":"https://openalex.org/W4404688000","doi":"https://doi.org/10.1109/tvlsi.2024.3488782"},"language":"en","primary_location":{"id":"doi:10.1109/tvlsi.2024.3488782","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2024.3488782","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035973043","display_name":"Zhaoteng Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhaoteng Meng","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Science, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100772108","display_name":"Lin Shu","orcid":"https://orcid.org/0000-0001-7468-8766"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Shu","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Science, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099431832","display_name":"Jianing Zeng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianing Zeng","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Science, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101265571","display_name":"Zhan Li","orcid":"https://orcid.org/0000-0001-8735-2620"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhan Li","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Science, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106521688","display_name":"Kailin Lv","orcid":null},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kailin Lv","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Science, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047646574","display_name":"Haoyue Yang","orcid":"https://orcid.org/0000-0001-8867-6504"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyue Yang","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Science, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing, China","institution_ids":["https://openalex.org/I4210094879"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108059994","display_name":"Jie Hao","orcid":"https://orcid.org/0000-0002-0273-8047"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Hao","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Science, Beijing, China","Institute of Automation, Chinese Academy of Science, Beijing"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing, China","institution_ids":["https://openalex.org/I4210094879"]},{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Science, Beijing","institution_ids":["https://openalex.org/I4210094879"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5035973043"],"corresponding_institution_ids":["https://openalex.org/I4210094879"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.23898493,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"33","issue":"3","first_page":"707","last_page":"719"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9549999833106995,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9549999833106995,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9386000037193298,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.9381999969482422,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lookup-table","display_name":"Lookup table","score":0.711357831954956},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5696976780891418},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5519489645957947},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5454176664352417},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4397450089454651},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.40802037715911865},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3499569892883301},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1283780038356781},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.08126288652420044},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.06681549549102783}],"concepts":[{"id":"https://openalex.org/C134835016","wikidata":"https://www.wikidata.org/wiki/Q690265","display_name":"Lookup table","level":2,"score":0.711357831954956},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5696976780891418},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5519489645957947},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5454176664352417},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4397450089454651},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.40802037715911865},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3499569892883301},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1283780038356781},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.08126288652420044},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.06681549549102783},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tvlsi.2024.3488782","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2024.3488782","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.8100000023841858}],"awards":[{"id":"https://openalex.org/G8323016548","display_name":null,"funder_award_id":"62236007","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1991151262","https://openalex.org/W2018435387","https://openalex.org/W2108598243","https://openalex.org/W2131763976","https://openalex.org/W2137983211","https://openalex.org/W2591659919","https://openalex.org/W2896478499","https://openalex.org/W2903610779","https://openalex.org/W2920954974","https://openalex.org/W2921918777","https://openalex.org/W2963367920","https://openalex.org/W2969262604","https://openalex.org/W2982144630","https://openalex.org/W2999842097","https://openalex.org/W3011338798","https://openalex.org/W3016021860","https://openalex.org/W3034429256","https://openalex.org/W3048842964","https://openalex.org/W3103355636","https://openalex.org/W3116653680","https://openalex.org/W3135859967","https://openalex.org/W3136275618","https://openalex.org/W3160664745","https://openalex.org/W3189138869","https://openalex.org/W3207265322","https://openalex.org/W3208821873","https://openalex.org/W3211525823","https://openalex.org/W4281660701","https://openalex.org/W4285814381","https://openalex.org/W4293025109","https://openalex.org/W4293195632","https://openalex.org/W4312204776","https://openalex.org/W4312373098","https://openalex.org/W4327930476","https://openalex.org/W4380880261","https://openalex.org/W4385300578","https://openalex.org/W4385451479","https://openalex.org/W4386764151","https://openalex.org/W4386765242","https://openalex.org/W4389041331","https://openalex.org/W4389163044","https://openalex.org/W4390874053","https://openalex.org/W4390904880","https://openalex.org/W6737664043","https://openalex.org/W6745245109","https://openalex.org/W6762718338","https://openalex.org/W6838539104"],"related_works":["https://openalex.org/W2798215405","https://openalex.org/W2990962948","https://openalex.org/W230091440","https://openalex.org/W2084169748","https://openalex.org/W2233261550","https://openalex.org/W2810751659","https://openalex.org/W258997015","https://openalex.org/W2997094352","https://openalex.org/W2127529229","https://openalex.org/W2125609625"],"abstract_inverted_index":{"On-device":[0],"deep":[1],"neural":[2],"network":[3],"(DNN)":[4],"training":[5,21,47],"faces":[6],"constraints":[7],"in":[8,75,93,121,158],"storage":[9],"capacity":[10],"and":[11,24,35,136,160,174,198],"energy":[12,38,199],"supply.":[13],"Existing":[14],"works":[15],"primarily":[16],"focus":[17],"on":[18],"optimizing":[19],"the":[20,31,37,46,55,72,89,94,98,111,117,129,175],"of":[22,40,48,116,128,170,177],"convolutional":[23],"batch":[25],"normalization":[26],"(BN)":[27],"layers":[28,50],"to":[29,54,70,86,140,148,190,203],"improve":[30],"compute-to-communication":[32],"(CTC)":[33],"ratio":[34],"reduce":[36],"cost":[39],"off-chip":[41,57,161],"memory":[42],"access":[43],"(MA).":[44],"However,":[45],"activation":[49,73,95,131,142],"remains":[51],"challenging":[52],"due":[53],"additional":[56],"MA":[58,162],"required":[59],"for":[60,113],"derivative":[61],"calculations.":[62],"This":[63],"article":[64],"proposes":[65],"MASL-AFU,":[66],"an":[67],"architecture":[68],"designed":[69],"accelerate":[71],"layer":[74],"on-device":[76],"DNN":[77],"training.":[78],"MASL-AFU":[79,133,145,166],"leverages":[80],"nonuniform":[81],"piecewise":[82],"linear":[83],"(NUPWL)":[84],"functions":[85],"speed":[87],"up":[88,147,189,202],"forward":[90],"propagation":[91,100],"(FP)":[92],"layer.":[96],"During":[97],"error":[99],"(EP)":[101],"process,":[102],"retrieving":[103],"derivatives":[104],"from":[105],"a":[106,149],"lookup":[107],"table":[108],"(LUT)":[109],"eliminates":[110],"need":[112],"redundant":[114],"retrieval":[115],"input":[118],"data":[119,172],"used":[120],"FP.":[122],"By":[123],"storing":[124],"LUT":[125,178],"indices":[126],"instead":[127],"original":[130],"inputs,":[132],"significantly":[134],"reduces":[135],"accelerates":[137],"MA.":[138],"Compared":[139],"other":[141],"function":[143],"units,":[144],"offers":[146],"<inline-formula":[150,191,204],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[151,192,205],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[152,193,206],"<tex-math":[153,194,207],"notation=\"LaTeX\">$5.8\\times":[154],"$":[155,196,209],"</tex-math></inline-formula>":[156,197],"increase":[157],"computational":[159],"efficiency.":[163],"In":[164],"addition,":[165],"incorporates":[167],"two":[168],"dimensions":[169],"scalability:":[171],"precision":[173],"number":[176],"entries.":[179],"These":[180],"scalable,":[181],"hardware-friendly":[182],"methods":[183],"enhance":[184],"MASL-AFU\u2019s":[185],"area":[186],"efficiency":[187,200],"by":[188,201],"notation=\"LaTeX\">$3.24\\times":[195],"notation=\"LaTeX\">$3.85\\times":[208],"</tex-math></inline-formula>.":[210]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
