{"id":"https://openalex.org/W4312247188","doi":"https://doi.org/10.1109/tcsi.2022.3214528","title":"Accelerating Deep Convolutional Neural Networks Using Number Theoretic Transform","display_name":"Accelerating Deep Convolutional Neural Networks Using Number Theoretic Transform","publication_year":2022,"publication_date":"2022-11-03","ids":{"openalex":"https://openalex.org/W4312247188","doi":"https://doi.org/10.1109/tcsi.2022.3214528"},"language":"en","primary_location":{"id":"doi:10.1109/tcsi.2022.3214528","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2022.3214528","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038968038","display_name":"Prasetiyo Prasetiyo","orcid":null},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Prasetiyo","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075135160","display_name":"Seongmin Hong","orcid":"https://orcid.org/0000-0001-6904-8094"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seongmin Hong","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044869676","display_name":"Yashael Faith Arthanto","orcid":null},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yashael Faith Arthanto","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100447377","display_name":"Joo-Young Kim","orcid":"https://orcid.org/0000-0003-1099-1496"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Joo-Young Kim","raw_affiliation_strings":["School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5038968038"],"corresponding_institution_ids":["https://openalex.org/I157485424"],"apc_list":null,"apc_paid":null,"fwci":1.4086,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.82916511,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"70","issue":"1","first_page":"315","last_page":"326"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.738318920135498},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6948959827423096},{"id":"https://openalex.org/keywords/fast-fourier-transform","display_name":"Fast Fourier transform","score":0.5784060955047607},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5717682242393494},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5515885949134827},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5013599395751953},{"id":"https://openalex.org/keywords/discrete-fourier-transform","display_name":"Discrete Fourier transform (general)","score":0.4702295958995819},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.452709823846817},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4213762879371643},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.30441635847091675},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2822006344795227},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.28042834997177124},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27914348244667053},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16687101125717163},{"id":"https://openalex.org/keywords/fractional-fourier-transform","display_name":"Fractional Fourier transform","score":0.13775920867919922}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.738318920135498},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6948959827423096},{"id":"https://openalex.org/C75172450","wikidata":"https://www.wikidata.org/wiki/Q623950","display_name":"Fast Fourier transform","level":2,"score":0.5784060955047607},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5717682242393494},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5515885949134827},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5013599395751953},{"id":"https://openalex.org/C57733114","wikidata":"https://www.wikidata.org/wiki/Q1006032","display_name":"Discrete Fourier transform (general)","level":5,"score":0.4702295958995819},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.452709823846817},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4213762879371643},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.30441635847091675},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2822006344795227},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.28042834997177124},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27914348244667053},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16687101125717163},{"id":"https://openalex.org/C76563020","wikidata":"https://www.wikidata.org/wiki/Q4817582","display_name":"Fractional Fourier transform","level":4,"score":0.13775920867919922},{"id":"https://openalex.org/C203024314","wikidata":"https://www.wikidata.org/wiki/Q1365258","display_name":"Fourier analysis","level":3,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsi.2022.3214528","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsi.2022.3214528","pdf_url":null,"source":{"id":"https://openalex.org/S116977442","display_name":"IEEE Transactions on Circuits and Systems I Regular Papers","issn_l":"1549-8328","issn":["1549-8328","1558-0806"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems I: Regular Papers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4699999988079071,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[{"id":"https://openalex.org/G5093699767","display_name":null,"funder_award_id":"2021M3H6A1017683","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W2094756095","https://openalex.org/W2097117768","https://openalex.org/W2172654076","https://openalex.org/W2276486856","https://openalex.org/W2285660444","https://openalex.org/W2442974303","https://openalex.org/W2570343428","https://openalex.org/W2584311934","https://openalex.org/W2584616277","https://openalex.org/W2783720762","https://openalex.org/W2786845740","https://openalex.org/W2792503273","https://openalex.org/W2795915628","https://openalex.org/W2808739938","https://openalex.org/W2913221350","https://openalex.org/W2914725495","https://openalex.org/W2916484109","https://openalex.org/W2963122961","https://openalex.org/W2964525696","https://openalex.org/W2977634443","https://openalex.org/W3000160544","https://openalex.org/W3005924570","https://openalex.org/W3007444108","https://openalex.org/W3008408165","https://openalex.org/W3018618942","https://openalex.org/W3098382995","https://openalex.org/W3122230257","https://openalex.org/W3132745255","https://openalex.org/W3134012069","https://openalex.org/W3147354744","https://openalex.org/W3158912502","https://openalex.org/W3159196909","https://openalex.org/W3171251238","https://openalex.org/W3193946904","https://openalex.org/W3216623900","https://openalex.org/W4205884968","https://openalex.org/W4237812669","https://openalex.org/W4243682116","https://openalex.org/W4250640407","https://openalex.org/W4288413318","https://openalex.org/W6637373629","https://openalex.org/W6767597771","https://openalex.org/W6789862346"],"related_works":["https://openalex.org/W2154006536","https://openalex.org/W2348800014","https://openalex.org/W2365391860","https://openalex.org/W3034421924","https://openalex.org/W2982536526","https://openalex.org/W4386858688","https://openalex.org/W1820187807","https://openalex.org/W4380302312","https://openalex.org/W4390971171","https://openalex.org/W4362564158"],"abstract_inverted_index":{"Modern":[0],"deep":[1,167],"convolutional":[2],"neural":[3],"networks":[4],"(CNNs)":[5],"suffer":[6],"from":[7],"high":[8],"computational":[9],"complexity":[10],"due":[11],"to":[12,32,198],"excessive":[13],"convolution":[14,18,45],"operations.":[15],"Recently,":[16],"fast":[17,22,58,193],"algorithms":[19],"such":[20],"as":[21],"Fourier":[23],"transform":[24,28,55,91],"(FFT)":[25],"and":[26,72,103,110,122,146,162,179,186],"Winograd":[27],"have":[29,62],"gained":[30],"attention":[31],"address":[33],"this":[34,79],"problem.":[35],"They":[36],"reduce":[37],"the":[38,44,54,95,100,118,128,133,142,151,157,173,191],"number":[39,89],"of":[40],"multiplications":[41],"required":[42],"in":[43,53,75,127],"operation":[46],"by":[47],"replacing":[48],"it":[49,164],"with":[50,141],"element-wise":[51],"multiplication":[52],"domain.":[56],"However,":[57],"convolution-based":[59,194],"CNN":[60,85,154,168,195],"accelerators":[61,196],"three":[63],"major":[64],"concerns:":[65],"expensive":[66],"domain":[67,114],"transform,":[68,115],"large":[69],"memory":[70],"overhead,":[71],"limited":[73],"flexibility":[74],"kernel":[76],"size.":[77],"In":[78],"paper,":[80],"we":[81,149],"present":[82],"a":[83,171],"novel":[84],"accelerator":[86,134,155,175],"based":[87],"on":[88,156],"theoretic":[90],"(NTT),":[92],"which":[93,116],"overcomes":[94],"existing":[96,192],"limitations.":[97],"We":[98,130],"propose":[99,132],"low-cost":[101],"NTT":[102],"inverse-NTT":[104],"converter":[105],"that":[106,136],"only":[107],"use":[108],"adders":[109],"shifters":[111],"for":[112,165,183],"on-chip":[113],"solves":[117],"inflated":[119],"bandwidth":[120],"problem":[121],"enables":[123],"more":[124],"parallel":[125],"computations":[126],"accelerator.":[129],"also":[131],"architecture":[135],"includes":[137],"multiple":[138],"tile":[139],"engines":[140],"optimized":[143],"data":[144],"flow":[145],"mapping.":[147],"Finally,":[148],"implement":[150],"proposed":[152,174],"NTT-based":[153],"Xilinx":[158],"Alveo":[159],"U50":[160],"FPGA":[161],"evaluate":[163],"popular":[166],"models.":[169],"As":[170],"result,":[172],"achieves":[176],"2859.5,":[177],"990.3,":[178],"805.6":[180],"GOPS":[181],"throughput":[182],"VGG-16,":[184],"GoogLeNet,":[185],"Darknet-19,":[187],"respectively.":[188],"It":[189],"outperforms":[190],"up":[197],"<inline-formula":[199],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[200],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[201],"<tex-math":[202],"notation=\"LaTeX\">$9.6\\times":[203],"$":[204],"</tex-math></inline-formula>":[205],".":[206]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
