{"id":"https://openalex.org/W3159730268","doi":"https://doi.org/10.1109/iscas51556.2021.9401192","title":"An Energy-Efficient Convolution Unit for Depthwise Separable Convolutional Neural Networks","display_name":"An Energy-Efficient Convolution Unit for Depthwise Separable Convolutional Neural Networks","publication_year":2021,"publication_date":"2021-04-27","ids":{"openalex":"https://openalex.org/W3159730268","doi":"https://doi.org/10.1109/iscas51556.2021.9401192","mag":"3159730268"},"language":"en","primary_location":{"id":"doi:10.1109/iscas51556.2021.9401192","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas51556.2021.9401192","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://dr.ntu.edu.sg/bitstream/10356/152096/2/ISCAS2021%20An_Accelerator_for_Depthwise_Separable_CNN_Final.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019055130","display_name":"Yi Sheng Chong","orcid":"https://orcid.org/0000-0003-4136-6570"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]},{"id":"https://openalex.org/I4210094970","display_name":"Energy Research Institute","ror":"https://ror.org/00ndnb620","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094970","https://openalex.org/I4210142748"]}],"countries":["CN","SG"],"is_corresponding":true,"raw_author_name":"Yi Sheng Chong","raw_affiliation_strings":["Energy Research Institute, Interdisciplinary Graduate Programme, NTU, Singapore","School of Electrical and Electronic Engineering, Nanyang Technological University (NTU), Singapore"],"affiliations":[{"raw_affiliation_string":"Energy Research Institute, Interdisciplinary Graduate Programme, NTU, Singapore","institution_ids":["https://openalex.org/I4210094970"]},{"raw_affiliation_string":"School of Electrical and Electronic Engineering, Nanyang Technological University (NTU), Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042682339","display_name":"Wang Ling Goh","orcid":"https://orcid.org/0000-0001-7466-8941"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Wang Ling Goh","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068243197","display_name":"Yew-Soon Ong","orcid":"https://orcid.org/0000-0002-4480-169X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yew Soon Ong","raw_affiliation_strings":["School of Computer Science and Engineering, NTU, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, NTU, Singapore","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036682724","display_name":"Vishnu P. Nambiar","orcid":"https://orcid.org/0000-0001-5570-5911"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I4210090209","display_name":"Institute of Microelectronics","ror":"https://ror.org/009rw8n36","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I4210090209","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Vishnu P. Nambiar","raw_affiliation_strings":["Institute of Microelectronics, A*STAR, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute of Microelectronics, A*STAR, Singapore","institution_ids":["https://openalex.org/I4210090209","https://openalex.org/I115228651"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101615706","display_name":"Anh Tuan","orcid":"https://orcid.org/0000-0002-8320-6818"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I4210090209","display_name":"Institute of Microelectronics","ror":"https://ror.org/009rw8n36","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I4210090209","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Anh Tuan Do","raw_affiliation_strings":["Institute of Microelectronics, A*STAR, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute of Microelectronics, A*STAR, Singapore","institution_ids":["https://openalex.org/I4210090209","https://openalex.org/I115228651"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5019055130"],"corresponding_institution_ids":["https://openalex.org/I172675005","https://openalex.org/I4210094970"],"apc_list":null,"apc_paid":null,"fwci":0.9684,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.77070053,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.7562615871429443},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7429726123809814},{"id":"https://openalex.org/keywords/pointwise","display_name":"Pointwise","score":0.7260407209396362},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7040601968765259},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.5667656660079956},{"id":"https://openalex.org/keywords/separable-space","display_name":"Separable space","score":0.5147697925567627},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5047630071640015},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.484737366437912},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.48365795612335205},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.46757036447525024},{"id":"https://openalex.org/keywords/cmos","display_name":"CMOS","score":0.42777392268180847},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3630651533603668},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3525437116622925},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3252946734428406},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.31120565533638},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19094905257225037},{"id":"https://openalex.org/keywords/electronic-engineering","display_name":"Electronic engineering","score":0.17490187287330627},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14998221397399902}],"concepts":[{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.7562615871429443},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7429726123809814},{"id":"https://openalex.org/C2777984123","wikidata":"https://www.wikidata.org/wiki/Q9248237","display_name":"Pointwise","level":2,"score":0.7260407209396362},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7040601968765259},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.5667656660079956},{"id":"https://openalex.org/C70710897","wikidata":"https://www.wikidata.org/wiki/Q680081","display_name":"Separable space","level":2,"score":0.5147697925567627},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5047630071640015},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.484737366437912},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.48365795612335205},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.46757036447525024},{"id":"https://openalex.org/C46362747","wikidata":"https://www.wikidata.org/wiki/Q173431","display_name":"CMOS","level":2,"score":0.42777392268180847},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3630651533603668},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3525437116622925},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3252946734428406},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.31120565533638},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19094905257225037},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.17490187287330627},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14998221397399902},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iscas51556.2021.9401192","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas51556.2021.9401192","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/152096","is_oa":true,"landing_page_url":"https://hdl.handle.net/10356/152096","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/152096/2/ISCAS2021%20An_Accelerator_for_Depthwise_Separable_CNN_Final.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference Paper"}],"best_oa_location":{"id":"pmh:oai:dr.ntu.edu.sg:10356/152096","is_oa":true,"landing_page_url":"https://hdl.handle.net/10356/152096","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/152096/2/ISCAS2021%20An_Accelerator_for_Depthwise_Separable_CNN_Final.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference Paper"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3159730268.pdf"},"referenced_works_count":19,"referenced_works":["https://openalex.org/W1578218114","https://openalex.org/W2125066085","https://openalex.org/W2260498192","https://openalex.org/W2289252105","https://openalex.org/W2531409750","https://openalex.org/W2565960208","https://openalex.org/W2604319603","https://openalex.org/W2612445135","https://openalex.org/W2782812883","https://openalex.org/W2808463410","https://openalex.org/W2887936511","https://openalex.org/W2946289095","https://openalex.org/W2963163009","https://openalex.org/W3024621361","https://openalex.org/W4297775537","https://openalex.org/W6696405057","https://openalex.org/W6728184133","https://openalex.org/W6737664043","https://openalex.org/W6749781174"],"related_works":["https://openalex.org/W143502885","https://openalex.org/W4361003569","https://openalex.org/W2530952058","https://openalex.org/W2981421796","https://openalex.org/W2582836483","https://openalex.org/W4299366318","https://openalex.org/W3158431807","https://openalex.org/W4297580547","https://openalex.org/W2951583185","https://openalex.org/W4308155352"],"abstract_inverted_index":{"High":[0],"performance":[1],"but":[2],"computationally":[3],"expensive":[4],"Convolutional":[5],"Neural":[6],"Networks":[7],"(CNNs)":[8],"require":[9],"both":[10],"algorithmic":[11],"and":[12,20,43,68],"custom":[13],"hardware":[14],"improvement":[15],"to":[16,21,36,77,88],"reduce":[17,37],"model":[18],"size":[19],"improve":[22],"energy":[23,119],"efficiency":[24,108],"for":[25,66,118],"edge":[26,121],"computing":[27,122],"applications.":[28,123],"Recent":[29],"CNN":[30,57],"architectures":[31],"employ":[32],"depthwise":[33,47,69],"separable":[34,48],"convolution":[35,49,93],"the":[38,96],"total":[39],"number":[40],"of":[41,109],"weights":[42],"MAC":[44],"operations.":[45],"However,":[46],"workload":[50],"does":[51],"not":[52],"run":[53],"efficiently":[54],"in":[55,91],"existing":[56],"accelerators.":[58],"This":[59],"paper":[60],"proposes":[61],"an":[62],"energy-efficient":[63],"CONV":[64,72],"unit":[65,73],"pointwise":[67,92],"operation.":[70],"The":[71,81],"utilizes":[74],"weight":[75],"stationary":[76],"enable":[78],"high":[79],"efficiency.":[80],"row":[82],"partial":[83,101],"sum":[84],"reduction":[85],"is":[86,116],"engaged":[87],"increase":[89],"parallelism":[90],"thereby":[94],"lightening":[95],"memory":[97],"requirements":[98],"on":[99],"output":[100],"sums.":[102],"Our":[103],"design":[104],"achieves":[105],"a":[106],"maximum":[107],"3.17":[110],"TOPS/W":[111],"at":[112],"0.85V/40nm":[113],"CMOS":[114],"which":[115],"well-suited":[117],"constrained":[120]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":3}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
