{"id":"https://openalex.org/W4416306874","doi":"https://doi.org/10.1007/s42514-025-00253-y","title":"Optimizing Standard Convolution for Diverse Precision on DCU","display_name":"Optimizing Standard Convolution for Diverse Precision on DCU","publication_year":2025,"publication_date":"2025-11-18","ids":{"openalex":"https://openalex.org/W4416306874","doi":"https://doi.org/10.1007/s42514-025-00253-y"},"language":"en","primary_location":{"id":"doi:10.1007/s42514-025-00253-y","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s42514-025-00253-y","pdf_url":null,"source":{"id":"https://openalex.org/S4210190911","display_name":"CCF Transactions on High Performance Computing","issn_l":"2524-4922","issn":["2524-4922","2524-4930"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"CCF Transactions on High Performance Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070079841","display_name":"Haobo Hua","orcid":"https://orcid.org/0000-0002-8015-6392"},"institutions":[{"id":"https://openalex.org/I192868223","display_name":"Zhengzhou University of Aeronautics","ror":"https://ror.org/01qjyzh50","country_code":"CN","type":"education","lineage":["https://openalex.org/I192868223"]},{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haobo Hua","raw_affiliation_strings":["Henan Paifu Information Technology Co., Ltd., No.289 West 3rd Ring Road, Zhengzhou, 450001, Henan, China","National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","School of Mathematics, Zhengzhou University of Aeronautics, No. 15 Wenyuan Road, Zhengzhou, 450046, Henan, China"],"raw_orcid":"https://orcid.org/0000-0002-8015-6392","affiliations":[{"raw_affiliation_string":"Henan Paifu Information Technology Co., Ltd., No.289 West 3rd Ring Road, Zhengzhou, 450001, Henan, China","institution_ids":[]},{"raw_affiliation_string":"National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]},{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]},{"raw_affiliation_string":"School of Mathematics, Zhengzhou University of Aeronautics, No. 15 Wenyuan Road, Zhengzhou, 450046, Henan, China","institution_ids":["https://openalex.org/I192868223"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120502898","display_name":"Chuangzheng Hou","orcid":null},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuangzheng Hou","raw_affiliation_strings":["National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]},{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhuxin Wen","orcid":null},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuxin Wen","raw_affiliation_strings":["National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]},{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013780891","display_name":"Xiangkai Zhang","orcid":"https://orcid.org/0000-0002-9294-3289"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangkai Zhang","raw_affiliation_strings":["National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]},{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101753920","display_name":"Xiaodong Yu","orcid":"https://orcid.org/0000-0003-0826-1056"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodong Yu","raw_affiliation_strings":["National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]},{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022800604","display_name":"Jiandong Shang","orcid":"https://orcid.org/0009-0001-7673-2641"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiandong Shang","raw_affiliation_strings":["National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China"],"raw_orcid":"https://orcid.org/0009-0001-7673-2641","affiliations":[{"raw_affiliation_string":"National Supercomputing Center in Zhengzhou, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]},{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, No.100 Science Avenue, Zhengzhou, 450001, Henan, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101674463","display_name":"Litao Zhang","orcid":"https://orcid.org/0000-0001-5771-1928"},"institutions":[{"id":"https://openalex.org/I192868223","display_name":"Zhengzhou University of Aeronautics","ror":"https://ror.org/01qjyzh50","country_code":"CN","type":"education","lineage":["https://openalex.org/I192868223"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Litao Zhang","raw_affiliation_strings":["School of Mathematics, Zhengzhou University of Aeronautics, No. 15 Wenyuan Road, Zhengzhou, 450046, Henan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mathematics, Zhengzhou University of Aeronautics, No. 15 Wenyuan Road, Zhengzhou, 450046, Henan, China","institution_ids":["https://openalex.org/I192868223"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5070079841"],"corresponding_institution_ids":["https://openalex.org/I192868223","https://openalex.org/I38877650"],"apc_list":{"value":2190,"currency":"EUR","value_usd":2790},"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.33731479,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"8","issue":"1","first_page":"61","last_page":"79"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8460999727249146,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8460999727249146,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.026499999687075615,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.01640000008046627,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.727400004863739},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.632099986076355},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6137999892234802},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5979999899864197},{"id":"https://openalex.org/keywords/memory-hierarchy","display_name":"Memory hierarchy","score":0.5907999873161316},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5281999707221985},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4706999957561493},{"id":"https://openalex.org/keywords/adder","display_name":"Adder","score":0.3041999936103821}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7942000031471252},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.727400004863739},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.632099986076355},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6137999892234802},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6047999858856201},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5979999899864197},{"id":"https://openalex.org/C2778100165","wikidata":"https://www.wikidata.org/wiki/Q1589327","display_name":"Memory hierarchy","level":3,"score":0.5907999873161316},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5281999707221985},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.4966999888420105},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4706999957561493},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.34200000762939453},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3327000141143799},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3075999915599823},{"id":"https://openalex.org/C164620267","wikidata":"https://www.wikidata.org/wiki/Q376953","display_name":"Adder","level":3,"score":0.3041999936103821},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.29679998755455017},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2944999933242798},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.29030001163482666},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2793000042438507},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2653000056743622},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2590000033378601},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.257999986410141},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.2574000060558319},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2540999948978424},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s42514-025-00253-y","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s42514-025-00253-y","pdf_url":null,"source":{"id":"https://openalex.org/S4210190911","display_name":"CCF Transactions on High Performance Computing","issn_l":"2524-4922","issn":["2524-4922","2524-4930"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"CCF Transactions on High Performance Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2002555321","https://openalex.org/W2072912074","https://openalex.org/W2172654076","https://openalex.org/W2605739168","https://openalex.org/W2617819327","https://openalex.org/W2913790721","https://openalex.org/W2945580137","https://openalex.org/W2950649068","https://openalex.org/W2964017942","https://openalex.org/W2964157630","https://openalex.org/W2983670846","https://openalex.org/W2998957070","https://openalex.org/W3022446491","https://openalex.org/W3034326778","https://openalex.org/W3034339621","https://openalex.org/W3034681889","https://openalex.org/W3043216033","https://openalex.org/W3166036439","https://openalex.org/W3176305871","https://openalex.org/W4225124368","https://openalex.org/W4381280256","https://openalex.org/W4381893775","https://openalex.org/W4385698913","https://openalex.org/W4390651816","https://openalex.org/W4392855244","https://openalex.org/W4399154859","https://openalex.org/W4405361299","https://openalex.org/W4407857002","https://openalex.org/W4409465464"],"related_works":[],"abstract_inverted_index":null,"counts_by_year":[],"updated_date":"2026-02-11T14:41:00.668223","created_date":"2025-11-18T00:00:00"}
