{"id":"https://openalex.org/W4385832149","doi":"https://doi.org/10.1109/tcsi.2023.3300657","title":"Optimizing FPGA-Based DNN Accelerator With Shared Exponential Floating-Point Format","display_name":"Optimizing FPGA-Based DNN Accelerator With Shared Exponential Floating-Point Format","publication_year":2023,"publication_date":"2023-08-15","ids":{"openalex":"https://openalex.org/W4385832149","doi":"https://doi.org/10.1109/tcsi.2023.3300657"},"language":"en","primary_location":{"id":"doi:10.1109/tcsi.2023.3300657","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2023.3300657","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006910313","display_name":"Wenzhe Zhao","orcid":"https://orcid.org/0000-0002-7001-2125"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wenzhe Zhao","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052924540","display_name":"Q. Dang","orcid":"https://orcid.org/0009-0006-0326-2999"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiwei Dang","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032104477","display_name":"Tian Xia","orcid":"https://orcid.org/0000-0002-2520-3731"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian Xia","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039426038","display_name":"Jingming Zhang","orcid":"https://orcid.org/0000-0002-0961-934X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jingming Zhang","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047405956","display_name":"Nanning Zheng","orcid":"https://orcid.org/0000-0003-1608-8257"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nanning Zheng","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044243518","display_name":"Pengju Ren","orcid":"https://orcid.org/0000-0003-1163-2014"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pengju Ren","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5006910313"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.0784,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.89182268,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"70","issue":"11","first_page":"4478","last_page":"4491"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.8366290330886841},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.8256268501281738},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7672044038772583},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6102105379104614},{"id":"https://openalex.org/keywords/fixed-point-arithmetic","display_name":"Fixed-point arithmetic","score":0.593603253364563},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5662953853607178},{"id":"https://openalex.org/keywords/digital-signal-processing","display_name":"Digital signal processing","score":0.5290022492408752},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.5059797167778015},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.43754467368125916},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.42109841108322144},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.357820600271225},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.35463863611221313},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.33194002509117126},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2735730707645416},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1933838129043579}],"concepts":[{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.8366290330886841},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.8256268501281738},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7672044038772583},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6102105379104614},{"id":"https://openalex.org/C163973906","wikidata":"https://www.wikidata.org/wiki/Q649900","display_name":"Fixed-point arithmetic","level":3,"score":0.593603253364563},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5662953853607178},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.5290022492408752},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.5059797167778015},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.43754467368125916},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.42109841108322144},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.357820600271225},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.35463863611221313},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.33194002509117126},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2735730707645416},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1933838129043579},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsi.2023.3300657","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2023.3300657","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5899999737739563,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[{"id":"https://openalex.org/G1900829300","display_name":null,"funder_award_id":"2022YFB4500500","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G3833898155","display_name":null,"funder_award_id":"62088102","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8788828744","display_name":null,"funder_award_id":"2022ZDLGY01-08","funder_id":"https://openalex.org/F4320336350","funder_display_name":"Key Research and Development Projects of Shaanxi Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320336350","display_name":"Key Research and Development Projects of Shaanxi Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1622676895","https://openalex.org/W1932624639","https://openalex.org/W2094756095","https://openalex.org/W2097117768","https://openalex.org/W2621405616","https://openalex.org/W2750822049","https://openalex.org/W2787091153","https://openalex.org/W2795961274","https://openalex.org/W2803935332","https://openalex.org/W2861440650","https://openalex.org/W2883920103","https://openalex.org/W2914242365","https://openalex.org/W2914286461","https://openalex.org/W2936278485","https://openalex.org/W2936672709","https://openalex.org/W2946355854","https://openalex.org/W2952773607","https://openalex.org/W2963037989","https://openalex.org/W2998506323","https://openalex.org/W3009327594","https://openalex.org/W3015847664","https://openalex.org/W3018757597","https://openalex.org/W3091969046","https://openalex.org/W3118608800","https://openalex.org/W3122898200","https://openalex.org/W3130554079","https://openalex.org/W3162993841","https://openalex.org/W3202442802","https://openalex.org/W3212505503","https://openalex.org/W4205884968","https://openalex.org/W4285146087","https://openalex.org/W4285227098","https://openalex.org/W4285507310","https://openalex.org/W4296079299","https://openalex.org/W4297924675","https://openalex.org/W4312383953","https://openalex.org/W4312857960","https://openalex.org/W6620707391","https://openalex.org/W6738373677","https://openalex.org/W6751552315","https://openalex.org/W6767032739","https://openalex.org/W6774235683","https://openalex.org/W6776767859","https://openalex.org/W6785530804","https://openalex.org/W6787972765","https://openalex.org/W6788610620","https://openalex.org/W6790409148"],"related_works":["https://openalex.org/W3206224488","https://openalex.org/W2288960809","https://openalex.org/W1935080020","https://openalex.org/W2062935593","https://openalex.org/W965527374","https://openalex.org/W2586397364","https://openalex.org/W2111431984","https://openalex.org/W2059483066","https://openalex.org/W4249587008","https://openalex.org/W4230766544"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"low-precision":[3],"fixed-point":[4,33,153],"computation":[5],"has":[6,21],"become":[7],"a":[8,55],"widely":[9],"used":[10],"technique":[11],"for":[12,51],"neural":[13,26,58,107,176],"network":[14,59,108],"inference":[15,96],"on":[16,61,174,187],"FPGAs.":[17],"However,":[18],"this":[19,76,78,102,163],"approach":[20],"some":[22],"limitations,":[23],"as":[24,36,92,169],"certain":[25],"networks":[27,177],"are":[28],"difficult":[29],"to":[30,66,120,129,149],"quantify":[31],"using":[32],"arithmetic,":[34],"such":[35],"those":[37,150],"involved":[38],"in":[39,162],"super-resolution":[40],"scaling,":[41],"image":[42],"denoising,":[43],"and":[44,70,131,146,180],"other":[45],"scenarios":[46],"that":[47,86,110,158],"lack":[48],"sufficient":[49],"conditions":[50],"fine-tuning.":[52,100],"Furthermore,":[53],"deploying":[54],"floating-point":[56,83,138],"precision":[57],"directly":[60],"an":[62,81,105],"FPGA":[63],"would":[64],"lead":[65],"significant":[67],"hardware":[68],"overhead":[69],"low":[71],"computational":[72],"efficiency.":[73],"To":[74],"address":[75],"issue,":[77],"paper":[79,103],"proposes":[80],"FPGA-friendly":[82],"data":[84],"format":[85],"achieves":[87,142,165,193],"the":[88,114,122,133,159,166,170,188,191,201,205],"same":[89,167],"storage":[90],"density":[91],"int8":[93],"without":[94,178],"sacrificing":[95],"accuracy":[97,168],"or":[98],"requiring":[99],"Additionally,":[101],"presents":[104],"FPGA-based":[106],"accelerator":[109,160],"is":[111],"compatible":[112],"with":[113],"proposed":[115,161],"format,":[116],"utilizing":[117],"DSP":[118,125],"resources":[119],"increase":[121],"number":[123],"of":[124,137,151],"cascading":[126],"from":[127],"7":[128],"16,":[130],"solving":[132],"back-to-back":[134],"accumulation":[135],"issue":[136],"numbers.":[139],"This":[140],"design":[141],"comparable":[143],"resource":[144],"consumption":[145],"execution":[147],"efficiency":[148],"8-bit":[152],"accelerators.":[154],"Experimental":[155],"results":[156],"demonstrate":[157],"study":[164],"native":[171],"floating":[172],"point":[173],"multiple":[175],"fine-tuning,":[179],"remains":[181],"high":[182],"computing":[183],"performance.":[184],"When":[185],"deployed":[186],"Xilinx":[189,206],"ZU9P,":[190],"performance":[192],"4.072":[194],"TFlops":[195],"at":[196],"250":[197],"MHz,":[198],"which":[199],"outperforms":[200],"previous":[202],"works,":[203],"including":[204],"official":[207],"DPU.":[208]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
