{"id":"https://openalex.org/W4409560185","doi":"https://doi.org/10.1109/tcsi.2025.3554635","title":"A High-Throughput FPGA Accelerator for Lightweight CNNs With Balanced Dataflow","display_name":"A High-Throughput FPGA Accelerator for Lightweight CNNs With Balanced Dataflow","publication_year":2025,"publication_date":"2025-04-17","ids":{"openalex":"https://openalex.org/W4409560185","doi":"https://doi.org/10.1109/tcsi.2025.3554635"},"language":"en","primary_location":{"id":"doi:10.1109/tcsi.2025.3554635","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2025.3554635","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Zhiyuan Zhao","orcid":"https://orcid.org/0009-0003-2884-2314"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiyuan Zhao","raw_affiliation_strings":["School of Microelectronics, University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0009-0003-2884-2314","affiliations":[{"raw_affiliation_string":"School of Microelectronics, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yihao Chen","orcid":"https://orcid.org/0009-0001-2723-200X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210149211","display_name":"Institute of Semiconductors","ror":"https://ror.org/048dd0611","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210149211"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yihao Chen","raw_affiliation_strings":["Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0001-2723-200X","affiliations":[{"raw_affiliation_string":"Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210149211","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114960823","display_name":"Pengcheng Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210149211","display_name":"Institute of Semiconductors","ror":"https://ror.org/048dd0611","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210149211"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengcheng Feng","raw_affiliation_strings":["Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210149211","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101944976","display_name":"Jixing Li","orcid":"https://orcid.org/0000-0002-1820-2087"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210149211","display_name":"Institute of Semiconductors","ror":"https://ror.org/048dd0611","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210149211"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jixing Li","raw_affiliation_strings":["Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1820-2087","affiliations":[{"raw_affiliation_string":"Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210149211","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100389323","display_name":"Gang Chen","orcid":"https://orcid.org/0000-0003-3157-0172"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210149211","display_name":"Institute of Semiconductors","ror":"https://ror.org/048dd0611","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210149211"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Chen","raw_affiliation_strings":["Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3157-0172","affiliations":[{"raw_affiliation_string":"Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210149211","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003118572","display_name":"Rongxuan Shen","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210149211","display_name":"Institute of Semiconductors","ror":"https://ror.org/048dd0611","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210149211"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rongxuan Shen","raw_affiliation_strings":["Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210149211","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050306282","display_name":"Huaxiang Lu","orcid":"https://orcid.org/0000-0002-5928-9705"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210149211","display_name":"Institute of Semiconductors","ror":"https://ror.org/048dd0611","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210149211"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaxiang Lu","raw_affiliation_strings":["Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5928-9705","affiliations":[{"raw_affiliation_string":"Institute of Semiconductors, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210149211","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":4.533,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.94374716,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"72","issue":"7","first_page":"3338","last_page":"3351"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9794999957084656,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.9093238115310669},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.8160660266876221},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.786573052406311},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6918567419052124},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.4599124789237976},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.45540010929107666},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4308892488479614},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.4071301221847534},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.23907357454299927}],"concepts":[{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.9093238115310669},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.8160660266876221},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.786573052406311},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6918567419052124},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.4599124789237976},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.45540010929107666},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4308892488479614},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.4071301221847534},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.23907357454299927},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsi.2025.3554635","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2025.3554635","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.5799999833106995}],"awards":[{"id":"https://openalex.org/G1411627799","display_name":null,"funder_award_id":"XDB44000000","funder_id":"https://openalex.org/F4320321133","funder_display_name":"Chinese Academy of Sciences"}],"funders":[{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W2112796928","https://openalex.org/W2126468361","https://openalex.org/W2194775991","https://openalex.org/W2466675884","https://openalex.org/W2883780447","https://openalex.org/W2883927138","https://openalex.org/W2887936511","https://openalex.org/W2907579173","https://openalex.org/W2933438941","https://openalex.org/W2935524202","https://openalex.org/W2945146780","https://openalex.org/W2951898149","https://openalex.org/W2963125010","https://openalex.org/W2963163009","https://openalex.org/W2974135602","https://openalex.org/W2981751377","https://openalex.org/W3000434371","https://openalex.org/W3008408165","https://openalex.org/W3082058622","https://openalex.org/W3093796669","https://openalex.org/W3127242686","https://openalex.org/W3132745255","https://openalex.org/W3161542527","https://openalex.org/W3162993841","https://openalex.org/W3164217046","https://openalex.org/W3206196385","https://openalex.org/W4205811585","https://openalex.org/W4205884968","https://openalex.org/W4214870144","https://openalex.org/W4221159612","https://openalex.org/W4291910419","https://openalex.org/W4297775537","https://openalex.org/W4312426786","https://openalex.org/W4312646647","https://openalex.org/W4389722504","https://openalex.org/W4390337077","https://openalex.org/W4400230149","https://openalex.org/W4400811497","https://openalex.org/W4401386645","https://openalex.org/W4401935077","https://openalex.org/W4404101766","https://openalex.org/W6637373629","https://openalex.org/W6737664043","https://openalex.org/W6810281471"],"related_works":["https://openalex.org/W2293118914","https://openalex.org/W2998381397","https://openalex.org/W4236419692","https://openalex.org/W2171015181","https://openalex.org/W3167919718","https://openalex.org/W2999668243","https://openalex.org/W1998888015","https://openalex.org/W1967938402","https://openalex.org/W2386041993","https://openalex.org/W1608572506"],"abstract_inverted_index":{"FPGA":[0],"accelerators":[1,16],"for":[2,101],"lightweight":[3],"convolutional":[4],"neural":[5],"networks":[6],"(LWCNNs)":[7],"have":[8],"recently":[9],"attracted":[10],"significant":[11],"attention.":[12],"Most":[13],"existing":[14],"LWCNN":[15,65,208],"focus":[17],"on":[18,128,143],"single-Computing-Engine":[19],"(CE)":[20],"architecture":[21,74],"with":[22,57,75,167],"local":[23],"optimization.":[24],"However,":[25],"these":[26,51],"designs":[27],"typically":[28],"suffer":[29],"from":[30],"high":[31,199],"on-chip/off-chip":[32],"memory":[33,83,120,165,170],"overhead":[34],"and":[35,44,68,113,121,136,149,187],"low":[36,88],"computational":[37,106],"efficiency":[38,107,191],"due":[39],"to":[40,62,80,104,132,161,173,184,194],"their":[41],"layer-by-layer":[42],"dataflow":[43,59,97],"unified":[45],"resource":[46,111],"mapping":[47,112],"mechanisms.":[48],"To":[49],"tackle":[50],"issues,":[52],"a":[53,72,87,95,118,129,188,198],"novel":[54],"multi-CE-based":[55],"accelerator":[56,140,157],"balanced":[58,96],"is":[60,78,99,125,141],"proposed":[61,139,156],"efficiently":[63],"accelerate":[64],"through":[66],"memory-oriented":[67],"computing-oriented":[69],"optimizations.":[70],"Firstly,":[71],"streaming":[73,102],"hybrid":[76],"CEs":[77],"designed":[79],"minimize":[81],"off-chip":[82,169],"access":[84,171],"while":[85,196],"maintaining":[86,197],"cost":[89],"of":[90,163,182,192,202],"on-chip":[91,164],"buffer":[92],"size.":[93],"Secondly,":[94],"strategy":[98],"introduced":[100],"architectures":[103],"enhance":[105],"by":[108],"improving":[109],"efficient":[110],"mitigating":[114],"data":[115],"congestion.":[116],"Furthermore,":[117],"resource-aware":[119],"parallelism":[122],"allocation":[123],"methodology":[124],"proposed,":[126],"based":[127],"performance":[130,135,181],"model,":[131],"achieve":[133],"better":[134],"scalability.":[137],"The":[138],"evaluated":[142],"Xilinx":[144],"ZC706":[145],"platform":[146],"using":[147],"MobileNetV2":[148],"ShuffleNetV2.":[150],"Implementation":[151],"results":[152],"demonstrate":[153],"that":[154],"the":[155,174],"can":[158],"save":[159],"up":[160,183,193],"68.3%":[162],"size":[166],"reduced":[168],"compared":[172],"reference":[175],"design.":[176],"It":[177],"achieves":[178],"an":[179],"impressive":[180],"2092.4":[185],"FPS":[186],"state-of-the-art":[189],"MAC":[190],"94.58%,":[195],"DSP":[200],"utilization":[201],"95%,":[203],"thus":[204],"significantly":[205],"outperforming":[206],"current":[207],"accelerators.":[209]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
