{"id":"https://openalex.org/W3123687588","doi":"https://doi.org/10.1109/lca.2021.3054371","title":"Row-Streaming Dataflow Using a Chaining Buffer and Systolic Array+ Structure","display_name":"Row-Streaming Dataflow Using a Chaining Buffer and Systolic Array+ Structure","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3123687588","doi":"https://doi.org/10.1109/lca.2021.3054371","mag":"3123687588"},"language":"en","primary_location":{"id":"doi:10.1109/lca.2021.3054371","is_oa":true,"landing_page_url":"https://doi.org/10.1109/lca.2021.3054371","pdf_url":"https://ieeexplore.ieee.org/ielx7/10208/9313849/09336234.pdf","source":{"id":"https://openalex.org/S17643076","display_name":"IEEE Computer Architecture Letters","issn_l":"1556-6056","issn":["1556-6056","1556-6064","2473-2575"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computer Architecture Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ieeexplore.ieee.org/ielx7/10208/9313849/09336234.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060526894","display_name":"Hweesoo Kim","orcid":"https://orcid.org/0000-0002-5147-0972"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Hweesoo Kim","raw_affiliation_strings":["Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025001772","display_name":"Sunjung Lee","orcid":"https://orcid.org/0000-0002-5177-0916"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sunjung Lee","raw_affiliation_strings":["Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032839104","display_name":"Jaewan Choi","orcid":"https://orcid.org/0000-0003-2447-4369"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaewan Choi","raw_affiliation_strings":["Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078262826","display_name":"Jung Ho Ahn","orcid":"https://orcid.org/0000-0003-1733-1394"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jung Ho Ahn","raw_affiliation_strings":["Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Information & Inter-University Semiconductor Research Center, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5060526894"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":null,"apc_paid":null,"fwci":0.5826,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.67047988,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"20","issue":"1","first_page":"34","last_page":"37"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.838417649269104},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.7446907758712769},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6448025703430176},{"id":"https://openalex.org/keywords/chaining","display_name":"Chaining","score":0.6080555319786072},{"id":"https://openalex.org/keywords/systolic-array","display_name":"Systolic array","score":0.5654763579368591},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5275881886482239},{"id":"https://openalex.org/keywords/column","display_name":"Column (typography)","score":0.5004959106445312},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4879912734031677},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.44222739338874817},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4336364269256592},{"id":"https://openalex.org/keywords/chip","display_name":"Chip","score":0.41413113474845886},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.35791921615600586},{"id":"https://openalex.org/keywords/very-large-scale-integration","display_name":"Very-large-scale integration","score":0.2720378041267395},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.22288495302200317},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.18732541799545288},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.12946957349777222},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.09023377299308777}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.838417649269104},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.7446907758712769},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6448025703430176},{"id":"https://openalex.org/C49020025","wikidata":"https://www.wikidata.org/wiki/Q1059099","display_name":"Chaining","level":2,"score":0.6080555319786072},{"id":"https://openalex.org/C150741067","wikidata":"https://www.wikidata.org/wiki/Q2377218","display_name":"Systolic array","level":3,"score":0.5654763579368591},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5275881886482239},{"id":"https://openalex.org/C2780551164","wikidata":"https://www.wikidata.org/wiki/Q2306599","display_name":"Column (typography)","level":3,"score":0.5004959106445312},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4879912734031677},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.44222739338874817},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4336364269256592},{"id":"https://openalex.org/C165005293","wikidata":"https://www.wikidata.org/wiki/Q1074500","display_name":"Chip","level":2,"score":0.41413113474845886},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.35791921615600586},{"id":"https://openalex.org/C14580979","wikidata":"https://www.wikidata.org/wiki/Q876049","display_name":"Very-large-scale integration","level":2,"score":0.2720378041267395},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.22288495302200317},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18732541799545288},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.12946957349777222},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.09023377299308777},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lca.2021.3054371","is_oa":true,"landing_page_url":"https://doi.org/10.1109/lca.2021.3054371","pdf_url":"https://ieeexplore.ieee.org/ielx7/10208/9313849/09336234.pdf","source":{"id":"https://openalex.org/S17643076","display_name":"IEEE Computer Architecture Letters","issn_l":"1556-6056","issn":["1556-6056","1556-6064","2473-2575"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computer Architecture Letters","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/lca.2021.3054371","is_oa":true,"landing_page_url":"https://doi.org/10.1109/lca.2021.3054371","pdf_url":"https://ieeexplore.ieee.org/ielx7/10208/9313849/09336234.pdf","source":{"id":"https://openalex.org/S17643076","display_name":"IEEE Computer Architecture Letters","issn_l":"1556-6056","issn":["1556-6056","1556-6064","2473-2575"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computer Architecture Letters","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G3338737308","display_name":null,"funder_award_id":"NRF-2018R1A5A1059921","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G342704958","display_name":null,"funder_award_id":"funded","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G690756877","display_name":null,"funder_award_id":"105992","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"},{"id":"https://openalex.org/G8190487336","display_name":null,"funder_award_id":"2018R1A5A1059921","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G982292920","display_name":null,"funder_award_id":"NRF-20","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320315121","display_name":"Samsung Advanced Institute of Technology","ror":null},{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320322202","display_name":"IC Design Education Center","ror":"https://ror.org/005v57z85"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"},{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3123687588.pdf","grobid_xml":"https://content.openalex.org/works/W3123687588.grobid-xml"},"referenced_works_count":11,"referenced_works":["https://openalex.org/W1999085092","https://openalex.org/W2100799944","https://openalex.org/W2194775991","https://openalex.org/W2289252105","https://openalex.org/W2604319603","https://openalex.org/W2606722458","https://openalex.org/W2790925711","https://openalex.org/W2963446712","https://openalex.org/W3102337469","https://openalex.org/W3145579537","https://openalex.org/W6786262024"],"related_works":["https://openalex.org/W2022229285","https://openalex.org/W46448156","https://openalex.org/W2283084692","https://openalex.org/W2130878144","https://openalex.org/W3172158163","https://openalex.org/W2150609674","https://openalex.org/W2138404091","https://openalex.org/W3034729708","https://openalex.org/W2078475991","https://openalex.org/W2112810905"],"abstract_inverted_index":{"Convolutional":[0,23],"Neural":[1],"Networks":[2],"(CNNs)":[3],"are":[4,26],"widely":[5],"used":[6],"to":[7,40,67,148,160,186],"solve":[8],"complex":[9],"problems":[10],"in":[11,130,163,168,177,189,194],"various":[12,35],"fields,":[13],"such":[14],"as":[15,72],"image":[16,18],"recognition,":[17],"classification,":[19],"and":[20,93,117,134,165,179,191],"video":[21],"analysis.":[22],"(CONV)":[24],"layers":[25],"the":[27,32,127,131,135,139,145,149,155,182],"most":[28],"computational":[29],"part":[30],"of":[31,50,54,97,174],"CNN":[33],"inference;":[34],"architectures":[36],"have":[37],"been":[38],"proposed":[39,146],"process":[41,68],"it":[42],"efficiently.":[43],"Among":[44],"those,":[45],"a":[46,51,69,73,89,94,107,114,118],"systolic":[47,108],"array":[48,53],"consists":[49],"2D":[52],"processing":[55],"elements,":[56],"which":[57,79],"handle":[58],"GEneral":[59],"Matrix":[60],"Multiplication":[61],"(GEMM)":[62],"with":[63,113,170],"high":[64],"efficiency.":[65],"However,":[66],"CONV":[70,132,151],"layer":[71,133],"GEMM":[74],"type,":[75],"image-to-column":[76],"(im2col)":[77],"processing,":[78],"is":[80,84],"also":[81],"called":[82],"lowering,":[83],"required":[85],"per":[86],"layer,":[87],"necessitating":[88],"larger":[90],"on-chip":[91,99,141],"memory":[92,100],"considerable":[95],"amount":[96],"repetitive":[98,136],"access.":[101],"In":[102],"this":[103],"letter,":[104],"we":[105,153,180],"propose":[106],"array+":[109],"(SysAr+)":[110],"structure":[111],"augmented":[112],"chaining":[115],"buffer":[116],"row-streaming":[119],"dataflow":[120],"that":[121],"can":[122],"maximize":[123],"data":[124],"reuse":[125],"without":[126],"im2col":[128],"pre-process":[129],"access":[137],"from":[138],"large":[140],"memory.":[142],"By":[143],"applying":[144],"method":[147],"3\u00d73":[150],"layers,":[152],"reduce":[154],"energy":[156],"consumption":[157],"by":[158,184],"up":[159,185],"19.7":[161],"percent":[162,167,176,188,193],"ResNet":[164,190],"37.4":[166],"DenseNet":[169],"an":[171],"area":[172],"overhead":[173],"1.54":[175],"SysAr+,":[178],"improve":[181],"performance":[183],"32.4":[187],"12.1":[192],"DenseNet.":[195]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
