{"id":"https://openalex.org/W2971734772","doi":"https://doi.org/10.1109/tvlsi.2019.2935251","title":"An Energy-Efficient Deep Convolutional Neural Network Inference Processor With Enhanced Output Stationary Dataflow in 65-nm CMOS","display_name":"An Energy-Efficient Deep Convolutional Neural Network Inference Processor With Enhanced Output Stationary Dataflow in 65-nm CMOS","publication_year":2019,"publication_date":"2019-09-03","ids":{"openalex":"https://openalex.org/W2971734772","doi":"https://doi.org/10.1109/tvlsi.2019.2935251","mag":"2971734772"},"language":"en","primary_location":{"id":"doi:10.1109/tvlsi.2019.2935251","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2019.2935251","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013362846","display_name":"Jaehyeong Sim","orcid":"https://orcid.org/0000-0001-8722-8486"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jaehyeong Sim","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101594395","display_name":"Somin Lee","orcid":"https://orcid.org/0000-0001-9189-0384"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]},{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Somin Lee","raw_affiliation_strings":["Samsung Electronics, Hwasung, South Korea","School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"Samsung Electronics, Hwasung, South Korea","institution_ids":["https://openalex.org/I2250650973"]},{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052390471","display_name":"Lee\u2010Sup Kim","orcid":"https://orcid.org/0000-0001-9585-4591"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Lee-Sup Kim","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5013362846"],"corresponding_institution_ids":["https://openalex.org/I157485424"],"apc_list":null,"apc_paid":null,"fwci":4.0538,"has_fulltext":false,"cited_by_count":56,"citation_normalized_percentile":{"value":0.94492191,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"28","issue":"1","first_page":"87","last_page":"100"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.7978359460830688},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7524492740631104},{"id":"https://openalex.org/keywords/static-random-access-memory","display_name":"Static random-access memory","score":0.7396050095558167},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5362464785575867},{"id":"https://openalex.org/keywords/cmos","display_name":"CMOS","score":0.5265291929244995},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5158799886703491},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.4611648917198181},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4562593102455139},{"id":"https://openalex.org/keywords/chip","display_name":"Chip","score":0.4497907757759094},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.44779112935066223},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.4422233998775482},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.41834068298339844},{"id":"https://openalex.org/keywords/electronic-engineering","display_name":"Electronic engineering","score":0.22508707642555237},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1850517988204956},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.13085150718688965},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1080925464630127},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.0968180000782013},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08769232034683228}],"concepts":[{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.7978359460830688},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7524492740631104},{"id":"https://openalex.org/C68043766","wikidata":"https://www.wikidata.org/wiki/Q267416","display_name":"Static random-access memory","level":2,"score":0.7396050095558167},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5362464785575867},{"id":"https://openalex.org/C46362747","wikidata":"https://www.wikidata.org/wiki/Q173431","display_name":"CMOS","level":2,"score":0.5265291929244995},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5158799886703491},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.4611648917198181},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4562593102455139},{"id":"https://openalex.org/C165005293","wikidata":"https://www.wikidata.org/wiki/Q1074500","display_name":"Chip","level":2,"score":0.4497907757759094},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.44779112935066223},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.4422233998775482},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.41834068298339844},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.22508707642555237},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1850517988204956},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.13085150718688965},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1080925464630127},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.0968180000782013},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08769232034683228},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tvlsi.2019.2935251","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2019.2935251","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.9100000262260437}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322091","display_name":"Korea Institute of Science and Technology","ror":"https://ror.org/05kzfa883"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320322202","display_name":"IC Design Education Center","ror":"https://ror.org/005v57z85"},{"id":"https://openalex.org/F4320324161","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1998525920","https://openalex.org/W1999085092","https://openalex.org/W2002038549","https://openalex.org/W2048266589","https://openalex.org/W2067392247","https://openalex.org/W2067523571","https://openalex.org/W2094756095","https://openalex.org/W2108598243","https://openalex.org/W2109846948","https://openalex.org/W2152839228","https://openalex.org/W2163605009","https://openalex.org/W2168159483","https://openalex.org/W2194775991","https://openalex.org/W2289252105","https://openalex.org/W2290132443","https://openalex.org/W2310042802","https://openalex.org/W2388355420","https://openalex.org/W2440384215","https://openalex.org/W2442974303","https://openalex.org/W2515287984","https://openalex.org/W2520083297","https://openalex.org/W2593564159","https://openalex.org/W2594492285","https://openalex.org/W2594836184","https://openalex.org/W2604319603","https://openalex.org/W2605487586","https://openalex.org/W2612445135","https://openalex.org/W2767864757","https://openalex.org/W2792607576","https://openalex.org/W2793950911","https://openalex.org/W2794141774","https://openalex.org/W2794260578","https://openalex.org/W2963893493","https://openalex.org/W3024621361","https://openalex.org/W3118608800","https://openalex.org/W4238999275","https://openalex.org/W4297775537","https://openalex.org/W4387007199","https://openalex.org/W6637373629","https://openalex.org/W6667544498","https://openalex.org/W6684191040","https://openalex.org/W6698500090","https://openalex.org/W6734592959","https://openalex.org/W6735008196","https://openalex.org/W6737664043","https://openalex.org/W6749677685","https://openalex.org/W6787972765","https://openalex.org/W6856891780"],"related_works":["https://openalex.org/W2998381397","https://openalex.org/W4236419692","https://openalex.org/W3167919718","https://openalex.org/W4239447582","https://openalex.org/W2171015181","https://openalex.org/W4225271228","https://openalex.org/W1484403103","https://openalex.org/W2521947294","https://openalex.org/W2907307640","https://openalex.org/W2119025037"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,12,73],"deep":[3],"convolutional":[4],"neural":[5],"network":[6],"(CNN)":[7],"inference":[8],"processor":[9,88,144],"based":[10],"on":[11,20],"novel":[13],"enhanced":[14],"output":[15],"stationary":[16],"(EOS)":[17],"dataflow.":[18],"Based":[19],"the":[21,33,81,115,118],"observation":[22],"that":[23,69,142],"some":[24],"activations":[25],"are":[26,62],"commonly":[27],"used":[28],"in":[29],"two":[30,90],"successive":[31],"convolutions,":[32],"EOS":[34],"dataflow":[35],"employs":[36],"dedicated":[37],"register":[38],"files":[39],"(RFs)":[40],"for":[41,52],"storing":[42],"such":[43,68],"reused":[44],"activation":[45,77,84],"data":[46],"to":[47,79,110,130],"eliminate":[48],"redundant":[49],"memory":[50,136],"accesses":[51],"highly":[53],"energy-consuming":[54],"SRAM":[55],"banks.":[56],"In":[57],"addition,":[58],"processing":[59],"elements":[60],"(PEs)":[61],"split":[63],"into":[64],"multiple":[65],"small":[66],"groups":[67],"each":[70],"group":[71],"covers":[72],"tile":[74],"of":[75,83,117,147],"input":[76],"map":[78],"increase":[80,111,131],"usability":[82],"RFs":[85],"(ARFs).":[86],"The":[87,94,138],"has":[89],"different":[91],"voltage/frequency":[92],"domains.":[93],"computation":[95],"domain":[96],"with":[97],"512":[98],"PEs":[99],"operates":[100],"at":[101,124,150,154,158,163],"near-threshold":[102],"voltage":[103],"(NTV)":[104],"(0.4":[105],"V)":[106],"and":[107,127,134,161],"60-MHz":[108],"frequency":[109,129],"energy":[112,166],"efficiency,":[113],"while":[114],"rest":[116],"processors":[119],"including":[120],"848-KB":[121],"SRAMs":[122],"run":[123],"0.7":[125],"V":[126],"120-MHz":[128],"both":[132],"on-chip":[133],"off-chip":[135],"bandwidths.":[137],"measurement":[139],"results":[140],"show":[141],"our":[143],"is":[145],"capable":[146],"running":[148],"AlexNet":[149],"831":[151],"GOPS/W,":[152,156,160],"VGG-16":[153],"1151":[155],"ResNet-18":[157],"1004":[159],"MobileNet":[162],"948":[164],"GOPS/W":[165],"efficiency.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":14},{"year":2021,"cited_by_count":14},{"year":2020,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
