{"id":"https://openalex.org/W7123353318","doi":"https://doi.org/10.1109/access.2026.3653253","title":"C-SIMD: CORDIC-Driven SIMD Processing Element for Resource-Efficient Multi-Precision Deep Learning Inference","display_name":"C-SIMD: CORDIC-Driven SIMD Processing Element for Resource-Efficient Multi-Precision Deep Learning Inference","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7123353318","doi":"https://doi.org/10.1109/access.2026.3653253"},"language":"en","primary_location":{"id":"doi:10.1109/access.2026.3653253","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3653253","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2026.3653253","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064547635","display_name":"Vasundhara Trivedi","orcid":"https://orcid.org/0009-0009-3787-6296"},"institutions":[{"id":"https://openalex.org/I64295750","display_name":"Indian Institute of Technology Indore","ror":"https://ror.org/01hhf7w52","country_code":"IN","type":"education","lineage":["https://openalex.org/I64295750"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Vasundhara Trivedi","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology Indore, Indore, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology Indore, Indore, India","institution_ids":["https://openalex.org/I64295750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028707436","display_name":"Gopal Raut","orcid":"https://orcid.org/0000-0002-1046-9457"},"institutions":[{"id":"https://openalex.org/I176601375","display_name":"Khalifa University of Science and Technology","ror":"https://ror.org/05hffr360","country_code":"AE","type":"education","lineage":["https://openalex.org/I176601375"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Gopal Raut","raw_affiliation_strings":["Khalifa University, Abu Dhabi, United Arab Emirates"],"affiliations":[{"raw_affiliation_string":"Khalifa University, Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I176601375"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121876813","display_name":"Baker Mohammad","orcid":null},"institutions":[{"id":"https://openalex.org/I176601375","display_name":"Khalifa University of Science and Technology","ror":"https://ror.org/05hffr360","country_code":"AE","type":"education","lineage":["https://openalex.org/I176601375"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Baker Mohammad","raw_affiliation_strings":["Khalifa University, Abu Dhabi, United Arab Emirates"],"affiliations":[{"raw_affiliation_string":"Khalifa University, Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I176601375"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068792760","display_name":"Santosh Kumar Vishvakarma","orcid":"https://orcid.org/0000-0003-4223-0077"},"institutions":[{"id":"https://openalex.org/I64295750","display_name":"Indian Institute of Technology Indore","ror":"https://ror.org/01hhf7w52","country_code":"IN","type":"education","lineage":["https://openalex.org/I64295750"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Santosh Kumar Vishvakarma","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology Indore, Indore, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology Indore, Indore, India","institution_ids":["https://openalex.org/I64295750"]}]},{"author_position":"last","author":{"id":null,"display_name":"Akash Kumar","orcid":"https://orcid.org/0000-0001-7125-1737"},"institutions":[{"id":"https://openalex.org/I904495901","display_name":"Ruhr University Bochum","ror":"https://ror.org/04tsk2644","country_code":"DE","type":"education","lineage":["https://openalex.org/I904495901"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Akash Kumar","raw_affiliation_strings":["Chair of Embedded Systems, Ruhr University Bochum, Bochum, Germany"],"affiliations":[{"raw_affiliation_string":"Chair of Embedded Systems, Ruhr University Bochum, Bochum, Germany","institution_ids":["https://openalex.org/I904495901"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5064547635"],"corresponding_institution_ids":["https://openalex.org/I64295750"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12049494,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":null,"first_page":"19015","last_page":"19029"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.39070001244544983,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11697","display_name":"Numerical Methods and Algorithms","score":0.39070001244544983,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.09510000050067902,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10363","display_name":"Low-power high-performance VLSI design","score":0.05820000171661377,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.8054999709129333},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.683899998664856},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.6456999778747559},{"id":"https://openalex.org/keywords/operand","display_name":"Operand","score":0.6377999782562256},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5892000198364258},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5705999732017517},{"id":"https://openalex.org/keywords/adder","display_name":"Adder","score":0.5694000124931335},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5692999958992004},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.46070000529289246}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8705000281333923},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.8054999709129333},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.683899998664856},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.6456999778747559},{"id":"https://openalex.org/C55526617","wikidata":"https://www.wikidata.org/wiki/Q719375","display_name":"Operand","level":2,"score":0.6377999782562256},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6028000116348267},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5892000198364258},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5705999732017517},{"id":"https://openalex.org/C164620267","wikidata":"https://www.wikidata.org/wiki/Q376953","display_name":"Adder","level":3,"score":0.5694000124931335},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5692999958992004},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.46070000529289246},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.43869999051094055},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.4381999969482422},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40869998931884766},{"id":"https://openalex.org/C106515295","wikidata":"https://www.wikidata.org/wiki/Q26806595","display_name":"Parallel processing","level":2,"score":0.38749998807907104},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3702000081539154},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.3422999978065491},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C107598950","wikidata":"https://www.wikidata.org/wiki/Q259864","display_name":"Microarchitecture","level":2,"score":0.32420000433921814},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.32339999079704285},{"id":"https://openalex.org/C65232700","wikidata":"https://www.wikidata.org/wiki/Q5656403","display_name":"Hardware architecture","level":3,"score":0.32179999351501465},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3181999921798706},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.3059999942779541},{"id":"https://openalex.org/C170595534","wikidata":"https://www.wikidata.org/wiki/Q249743","display_name":"Very long instruction word","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C97137487","wikidata":"https://www.wikidata.org/wiki/Q729138","display_name":"Integer (computer science)","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.2809999883174896},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2784000039100647},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.2775000035762787},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.27720001339912415},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.2703999876976013},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C58013763","wikidata":"https://www.wikidata.org/wiki/Q5754574","display_name":"High-level synthesis","level":3,"score":0.2597000002861023}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2026.3653253","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3653253","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:354bc9de83c44c78be6ebf1c52c3b49e","is_oa":true,"landing_page_url":"https://doaj.org/article/354bc9de83c44c78be6ebf1c52c3b49e","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 14, Pp 19015-19029 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2026.3653253","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3653253","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1985956780","https://openalex.org/W2044829853","https://openalex.org/W2115452265","https://openalex.org/W2204073782","https://openalex.org/W2204310803","https://openalex.org/W2593564159","https://openalex.org/W2594492285","https://openalex.org/W2604319603","https://openalex.org/W2895531329","https://openalex.org/W2914973130","https://openalex.org/W2952857977","https://openalex.org/W2963367920","https://openalex.org/W2964504576","https://openalex.org/W2965976751","https://openalex.org/W2971946864","https://openalex.org/W3000371584","https://openalex.org/W3025143601","https://openalex.org/W3041601967","https://openalex.org/W3047364742","https://openalex.org/W3048933702","https://openalex.org/W3090369187","https://openalex.org/W3113606433","https://openalex.org/W3124625166","https://openalex.org/W3176754014","https://openalex.org/W3185215509","https://openalex.org/W3187235458","https://openalex.org/W4206262671","https://openalex.org/W4206957512","https://openalex.org/W4212886211","https://openalex.org/W4220829081","https://openalex.org/W4247198796","https://openalex.org/W4280493494","https://openalex.org/W4285250061","https://openalex.org/W4294691819","https://openalex.org/W4323345742","https://openalex.org/W4327522190","https://openalex.org/W4375861680","https://openalex.org/W4385575752","https://openalex.org/W4392979932","https://openalex.org/W4396949147"],"related_works":[],"abstract_inverted_index":{"The":[0,153],"growing":[1],"demand":[2],"for":[3,31,95,200],"efficient":[4],"deep":[5],"learning":[6],"inference":[7],"on":[8,182,186,192],"edge":[9],"devices":[10],"requires":[11],"hardware":[12],"that":[13],"is":[14],"both":[15],"precision-adaptive":[16],"and":[17,45,48,54,79,90,109,121,134,146,188],"resource-efficient.":[18],"This":[19],"paper":[20],"introduces":[21],"C-SIMD,":[22],"a":[23,167],"CORDIC-driven,":[24],"configurable":[25,83],"SIMD":[26],"Processing":[27],"Element":[28],"(PE)":[29],"architecture":[30,69],"scalable,":[32],"multi-precision":[33],"MAC":[34,173],"operations":[35],"in":[36,103],"DNN":[37],"accelerators.":[38],"C-SIMD":[39,93,116],"supports":[40,122],"dynamic":[41],"operand":[42],"precision":[43,74],"(4/8/16/32-bit)":[44],"enables":[46],"symmetric":[47],"asymmetric":[49,135],"computation":[50,61],"modes,":[51],"covering":[52],"integer":[53],"fixed-point":[55],"arithmetic.":[56],"By":[57],"leveraging":[58],"partial":[59],"product":[60],"with":[62],"pipelined":[63],"8-bit":[64],"CORDIC-based":[65],"approximate":[66],"multipliers,":[67],"the":[68,101,104],"scales":[70],"efficiently":[71],"to":[72,142,195],"higher":[73],"while":[75,160],"achieving":[76],"notable":[77],"area":[78,144],"power":[80],"savings.":[81],"A":[82],"pipeline":[84],"offers":[85],"tunable":[86],"trade-offs":[87],"between":[88],"accuracy":[89,179],"complexity,":[91],"making":[92],"suitable":[94],"resource-constrained":[96],"inference.":[97],"Strategic":[98],"reuse":[99],"of":[100],"adder":[102],"accumulation":[105],"path":[106],"enhances":[107],"throughput":[108,151],"optimizes":[110],"resource":[111],"utilization.":[112],"Unlike":[113],"prior":[114,172],"designs,":[115],"fully":[117],"exploits":[118],"available":[119],"resources":[120],"configurations":[123],"such":[124],"as":[125,147,149],"16":[126],"parallel":[127,130],"8\u00d78-bit,":[128],"4":[129],"16\u00d716-bit,":[131],"single":[132],"32\u00d732-bit,":[133],"32\u00d78-bit":[136],"MACs.":[137],"Hardware":[138],"evaluation":[139],"demonstrates":[140],"up":[141],"14.29%":[143],"savings":[145],"much":[148],"16.17\u00d7":[150],"improvement.":[152],"proposed":[154],"C-SIMD_Low":[155],"(4/8/16)":[156],"achieves":[157],"7.04":[158],"GOP/s,":[159,165],"C-SIMD_High":[161],"(8/16/32)":[162],"attains":[163],"4.16":[164],"delivering":[166],"4\u00d7":[168],"performance-efficiency":[169],"gain":[170],"over":[171],"architectures.":[174],"Inference":[175],"tests":[176],"indicate":[177],"minimal":[178],"loss\u2014below":[180],"1%":[181],"MNIST-LeNet,":[183],"under":[184],"2.9%":[185],"CIFAR-10-AlexNet,":[187],"less":[189],"than":[190],"2.2%":[191],"CIFAR-10-VGG16":[193],"compared":[194],"float32":[196],"baselines\u2014demonstrating":[197],"its":[198],"potential":[199],"high-throughput,":[201],"energy-efficient":[202],"Edge-AI":[203],"systems.":[204]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-01-14T00:00:00"}
