{"id":"https://openalex.org/W4405112145","doi":"https://doi.org/10.1145/3707209","title":"FPGA-based Block Minifloat Training Accelerator for a Time Series Prediction Network","display_name":"FPGA-based Block Minifloat Training Accelerator for a Time Series Prediction Network","publication_year":2024,"publication_date":"2024-12-06","ids":{"openalex":"https://openalex.org/W4405112145","doi":"https://doi.org/10.1145/3707209"},"language":"en","primary_location":{"id":"doi:10.1145/3707209","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3707209","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3707209","source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3707209","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wenjie Zhou","orcid":"https://orcid.org/0009-0005-7145-1639"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Wenjie Zhou","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","University of Sydney, Australia"],"raw_orcid":"https://orcid.org/0009-0005-7145-1639","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]},{"raw_affiliation_string":"University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008223884","display_name":"Haoyan Qi","orcid":null},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Haoyan Qi","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","University of Sydney, Australia"],"raw_orcid":"https://orcid.org/0009-0005-6173-0466","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]},{"raw_affiliation_string":"University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040792997","display_name":"David Boland","orcid":"https://orcid.org/0000-0001-5370-4464"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"David Boland","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","University of Sydney, Australia"],"raw_orcid":"https://orcid.org/0000-0001-5370-4464","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]},{"raw_affiliation_string":"University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107994859","display_name":"Philip H. W. Leong","orcid":"https://orcid.org/0000-0002-3923-3499"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Philip H. W. Leong","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","University of Sydney, Australia"],"raw_orcid":"https://orcid.org/0000-0002-3923-3499","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The University of Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]},{"raw_affiliation_string":"University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I129604602"],"apc_list":null,"apc_paid":null,"fwci":0.6294,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.75932429,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"18","issue":"2","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8892086148262024},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5859768986701965},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.5683839917182922},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.565752387046814},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5523197054862976},{"id":"https://openalex.org/keywords/lookup-table","display_name":"Lookup table","score":0.5464358329772949},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.5304994583129883},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.5144972801208496},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.5134197473526001},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.5121971964836121},{"id":"https://openalex.org/keywords/digital-signal-processing","display_name":"Digital signal processing","score":0.49811363220214844},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.46639272570610046},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.4650287330150604},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.4437195360660553},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4280807077884674},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.35623234510421753},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3516884446144104},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34127458930015564},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2653798460960388},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.10990360379219055},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.10360777378082275}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8892086148262024},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5859768986701965},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.5683839917182922},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.565752387046814},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5523197054862976},{"id":"https://openalex.org/C134835016","wikidata":"https://www.wikidata.org/wiki/Q690265","display_name":"Lookup table","level":2,"score":0.5464358329772949},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.5304994583129883},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.5144972801208496},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.5134197473526001},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.5121971964836121},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.49811363220214844},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.46639272570610046},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.4650287330150604},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.4437195360660553},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4280807077884674},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.35623234510421753},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3516884446144104},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34127458930015564},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2653798460960388},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.10990360379219055},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.10360777378082275},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3707209","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3707209","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3707209","source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3707209","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3707209","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3707209","source":{"id":"https://openalex.org/S112809824","display_name":"ACM Transactions on Reconfigurable Technology and Systems","issn_l":"1936-7406","issn":["1936-7406","1936-7414"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Reconfigurable Technology and Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.9100000262260437,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4405112145.pdf"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W1482147200","https://openalex.org/W2808800115","https://openalex.org/W2888546126","https://openalex.org/W2889797931","https://openalex.org/W2890068895","https://openalex.org/W2913707927","https://openalex.org/W2917518248","https://openalex.org/W2949833565","https://openalex.org/W2963459284","https://openalex.org/W2970821029","https://openalex.org/W3004303566","https://openalex.org/W3101100041","https://openalex.org/W3112412839","https://openalex.org/W3160017297","https://openalex.org/W3208633927","https://openalex.org/W3212505503","https://openalex.org/W4206557440","https://openalex.org/W4229896786","https://openalex.org/W4233996382","https://openalex.org/W4240862739","https://openalex.org/W4251309856","https://openalex.org/W4296914491","https://openalex.org/W4364859988","https://openalex.org/W4389163044","https://openalex.org/W4391429622","https://openalex.org/W6751609549"],"related_works":["https://openalex.org/W4322761281","https://openalex.org/W4238233472","https://openalex.org/W3111395152","https://openalex.org/W4313526662","https://openalex.org/W4313463218","https://openalex.org/W3106131444","https://openalex.org/W3216099748","https://openalex.org/W4205963435","https://openalex.org/W4312996489","https://openalex.org/W3214037210"],"abstract_inverted_index":{"Time":[0],"series":[1,98],"forecasting":[2],"is":[3,135],"the":[4,34,52,56,122],"problem":[5],"of":[6,128],"predicting":[7],"future":[8],"data":[9],"samples":[10],"from":[11],"historical":[12],"information":[13],"and":[14,40,71],"recent":[15],"deep":[16],"neural":[17],"network":[18],"(DNNs)":[19],"based":[20],"techniques":[21],"have":[22,43],"achieved":[23],"excellent":[24],"results":[25],"compared":[26],"with":[27],"conventional":[28],"statistical":[29],"approaches.":[30],"Many":[31],"applications":[32,77],"at":[33,51],"edge":[35,53,76],"can":[36],"utilize":[37],"this":[38,85],"technology":[39],"most":[41],"implementations":[42],"focused":[44],"on":[45],"inference,":[46],"an":[47],"ability":[48],"to":[49,58,60,120],"train":[50],"would":[54],"enable":[55],"DNN":[57],"adapt":[59],"changing":[61],"conditions.":[62],"Unfortunately,":[63],"training":[64,93],"requires":[65],"approximately":[66],"three":[67],"times":[68],"more":[69],"memory":[70],"computation":[72],"than":[73,141],"inference.":[74],"Moreover,":[75],"are":[78],"often":[79],"constrained":[80],"by":[81],"energy":[82],"efficiency.":[83],"In":[84],"work,":[86],"we":[87],"implement":[88],"a":[89,96,105,115,126,142,147],"block":[90],"minifloat":[91],"(BM)":[92],"accelerator":[94,108],"for":[95],"time":[97],"prediction":[99],"network,":[100],"N-BEATS.":[101],"Our":[102],"architecture":[103],"involves":[104],"mixed-precision":[106],"GEMM":[107],"that":[109],"utilizes":[110],"BM":[111],"arithmetic.":[112],"We":[113],"use":[114],"4-bit":[116],"DSP":[117],"packing":[118],"scheme":[119],"optimize":[121],"implementation":[123],"further,":[124],"achieving":[125],"throughput":[127],"779":[129],"Gops.":[130],"The":[131],"resulting":[132],"power":[133],"efficiency":[134],"42.4":[136],"Gops/W,":[137],"3.1":[138],"\\(\\times\\)":[139],"better":[140],"graphics":[143],"processing":[144],"unit":[145],"in":[146],"similar":[148],"technology.":[149]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
