{"id":"https://openalex.org/W4416429881","doi":"https://doi.org/10.1109/iccad66269.2025.11240801","title":"Optimizing Neural Networks with Learnable Non-Linear Activation Functions via Lookup-Based FPGA Acceleration","display_name":"Optimizing Neural Networks with Learnable Non-Linear Activation Functions via Lookup-Based FPGA Acceleration","publication_year":2025,"publication_date":"2025-10-26","ids":{"openalex":"https://openalex.org/W4416429881","doi":"https://doi.org/10.1109/iccad66269.2025.11240801"},"language":null,"primary_location":{"id":"doi:10.1109/iccad66269.2025.11240801","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccad66269.2025.11240801","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM International Conference On Computer Aided Design (ICCAD)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Mengyuan Yin","orcid":null},"institutions":[{"id":"https://openalex.org/I3004594783","display_name":"Institute of High Performance Computing","ror":"https://ror.org/02n0ejh50","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3004594783","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Mengyuan Yin","raw_affiliation_strings":["Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore","institution_ids":["https://openalex.org/I3004594783"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024753648","display_name":"Benjamin Chen Ming Choong","orcid":"https://orcid.org/0009-0007-9343-7517"},"institutions":[{"id":"https://openalex.org/I3004594783","display_name":"Institute of High Performance Computing","ror":"https://ror.org/02n0ejh50","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3004594783","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Benjamin Chen Ming Choong","raw_affiliation_strings":["Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore","institution_ids":["https://openalex.org/I3004594783"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069998800","display_name":"Chuping Qu","orcid":"https://orcid.org/0000-0002-9398-6037"},"institutions":[{"id":"https://openalex.org/I3004594783","display_name":"Institute of High Performance Computing","ror":"https://ror.org/02n0ejh50","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3004594783","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Chuping Qu","raw_affiliation_strings":["Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore","institution_ids":["https://openalex.org/I3004594783"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001599295","display_name":"Rick Siow Mong Goh","orcid":"https://orcid.org/0000-0001-9116-1595"},"institutions":[{"id":"https://openalex.org/I3004594783","display_name":"Institute of High Performance Computing","ror":"https://ror.org/02n0ejh50","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3004594783","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Rick Siow Mong Goh","raw_affiliation_strings":["Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore","institution_ids":["https://openalex.org/I3004594783"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023989495","display_name":"Weng\u2010Fai Wong","orcid":"https://orcid.org/0000-0002-4281-2053"},"institutions":[{"id":"https://openalex.org/I3004594783","display_name":"Institute of High Performance Computing","ror":"https://ror.org/02n0ejh50","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3004594783","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Weng-Fai Wong","raw_affiliation_strings":["Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore","institution_ids":["https://openalex.org/I3004594783"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101630043","display_name":"Tao Luo","orcid":"https://orcid.org/0000-0002-3415-3676"},"institutions":[{"id":"https://openalex.org/I3004594783","display_name":"Institute of High Performance Computing","ror":"https://ror.org/02n0ejh50","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3004594783","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Tao Luo","raw_affiliation_strings":["Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of High Performance Computing, A*STAR, Singapore National University of Singapore,Singapore","institution_ids":["https://openalex.org/I3004594783"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I3004594783"],"apc_list":null,"apc_paid":null,"fwci":0.9775,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.82032262,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.633400022983551,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.633400022983551,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.06040000170469284,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.03500000014901161,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reconfigurability","display_name":"Reconfigurability","score":0.8040000200271606},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.6843000054359436},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.5375000238418579},{"id":"https://openalex.org/keywords/lookup-table","display_name":"Lookup table","score":0.5105000138282776},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.4740999937057495},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.47350001335144043},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4731999933719635},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.46149998903274536},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.4244000017642975}],"concepts":[{"id":"https://openalex.org/C2780149590","wikidata":"https://www.wikidata.org/wiki/Q7302742","display_name":"Reconfigurability","level":2,"score":0.8040000200271606},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6967999935150146},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.6843000054359436},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.5375000238418579},{"id":"https://openalex.org/C134835016","wikidata":"https://www.wikidata.org/wiki/Q690265","display_name":"Lookup table","level":2,"score":0.5105000138282776},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.4740999937057495},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.47350001335144043},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4731999933719635},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.46149998903274536},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4244000017642975},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.39259999990463257},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.37619999051094055},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.37380000948905945},{"id":"https://openalex.org/C142962650","wikidata":"https://www.wikidata.org/wiki/Q240838","display_name":"Reconfigurable computing","level":3,"score":0.36039999127388},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.350600004196167},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.3391999900341034},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3319999873638153},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.3253999948501587},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.32190001010894775},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.32109999656677246},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.30640000104904175},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C132943942","wikidata":"https://www.wikidata.org/wiki/Q2562511","display_name":"Footprint","level":2,"score":0.2888999879360199},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C164620267","wikidata":"https://www.wikidata.org/wiki/Q376953","display_name":"Adder","level":3,"score":0.2667999863624573},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.25589999556541443},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccad66269.2025.11240801","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccad66269.2025.11240801","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM International Conference On Computer Aided Design (ICCAD)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W2007339694","https://openalex.org/W2201305792","https://openalex.org/W2553754377","https://openalex.org/W2565125333","https://openalex.org/W2583383421","https://openalex.org/W2730411900","https://openalex.org/W2951537853","https://openalex.org/W3000933965","https://openalex.org/W3037632138","https://openalex.org/W3093982621","https://openalex.org/W4200506235","https://openalex.org/W4293025109","https://openalex.org/W4312263904","https://openalex.org/W4312554056","https://openalex.org/W4391455313","https://openalex.org/W4392972248","https://openalex.org/W4404781142"],"related_works":[],"abstract_inverted_index":{"Learned":[0],"activation":[1,76,103,165],"functions":[2,104],"in":[3,12],"models":[4],"like":[5],"Kolmogorov-Arnold":[6],"Networks":[7],"(KANs)":[8],"outperform":[9],"fixed-activation":[10],"architectures":[11],"terms":[13],"of":[14,163],"accuracy":[15,135],"and":[16,35,117,130,136,156],"interpretability;":[17],"however,":[18],"their":[19],"computational":[20,115,154],"complexity":[21],"poses":[22],"critical":[23,107],"challenges":[24],"for":[25,84,90,149],"energy-constrained":[26],"edge":[27,58,91,128,151],"AI":[28],"deployments.":[29],"Conventional":[30],"CPUs/GPUs":[31],"incur":[32],"prohibitive":[33],"latency":[34],"power":[36,157],"costs":[37],"when":[38],"evaluating":[39],"higher":[40,123],"order":[41],"activations,":[42],"limiting":[43],"deployability":[44],"under":[45],"ultra-tight":[46],"energy":[47,124],"budgets.":[48],"We":[49],"address":[50],"this":[51],"via":[52],"a":[53,87,106,146],"reconfigurable":[54],"lookup":[55,66],"architecture":[56],"with":[57,64],"FPGAs.":[59],"By":[60],"coupling":[61],"fine-grained":[62],"quantization":[63],"adaptive":[65,164],"tables,":[67],"our":[68,110,143],"design":[69,112],"minimizes":[70],"energy-intensive":[71],"arithmetic":[72],"operations":[73],"while":[74,132],"preserving":[75],"fidelity.":[77],"FPGA":[78],"reconfigurability":[79],"enables":[80],"dynamic":[81],"hardware":[82],"specialization":[83],"learned":[85],"functions,":[86],"key":[88],"advantage":[89],"systems":[92],"that":[93,109],"require":[94],"post-deployment":[95],"adaptability.":[96],"Evaluations":[97],"using":[98],"KANs":[99],"-":[100],"where":[101,153],"unique":[102],"play":[105],"role\u2014demonstrate":[108],"FPGA-based":[111],"achieves":[113],"superior":[114],"speed":[116],"over":[118],"10<sup":[119],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[120],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">4</sup>":[121],"times":[122],"efficiency":[125],"compared":[126],"to":[127],"CPUs":[129],"GPUs,":[131],"maintaining":[133],"matching":[134],"minimal":[137],"footprint":[138],"overhead.":[139],"This":[140],"breakthrough":[141],"positions":[142],"approach":[144],"as":[145],"practical":[147],"enabler":[148],"energy-critical":[150],"AI,":[152],"intensity":[155],"constraints":[158],"traditionally":[159],"preclude":[160],"the":[161],"use":[162],"networks.":[166]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-30T09:04:40.226872","created_date":"2025-11-20T00:00:00"}
