{"id":"https://openalex.org/W4386763895","doi":"https://doi.org/10.1109/dac56929.2023.10247939","title":"Invited: Algorithm-Software-Hardware Co-Design for Deep Learning Acceleration","display_name":"Invited: Algorithm-Software-Hardware Co-Design for Deep Learning Acceleration","publication_year":2023,"publication_date":"2023-07-09","ids":{"openalex":"https://openalex.org/W4386763895","doi":"https://doi.org/10.1109/dac56929.2023.10247939"},"language":"en","primary_location":{"id":"doi:10.1109/dac56929.2023.10247939","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/dac56929.2023.10247939","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 60th ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101633365","display_name":"Zhengang Li","orcid":"https://orcid.org/0000-0001-6644-4761"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":true,"raw_author_name":"Zhengang Li","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088784101","display_name":"Yanyue Xie","orcid":"https://orcid.org/0000-0002-4325-521X"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Yanyue Xie","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089349472","display_name":"Peiyan Dong","orcid":"https://orcid.org/0000-0001-5287-5149"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Peiyan Dong","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049723281","display_name":"Olivia Chen","orcid":"https://orcid.org/0000-0002-2208-0262"},"institutions":[{"id":"https://openalex.org/I185088104","display_name":"Tokyo City University","ror":"https://ror.org/04dt6bw53","country_code":"JP","type":"education","lineage":["https://openalex.org/I185088104"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Olivia Chen","raw_affiliation_strings":["Tokyo City University"],"affiliations":[{"raw_affiliation_string":"Tokyo City University","institution_ids":["https://openalex.org/I185088104"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100651384","display_name":"Yanzhi Wang","orcid":"https://orcid.org/0000-0002-3024-7990"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Yanzhi Wang","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101633365"],"corresponding_institution_ids":["https://openalex.org/I87182695"],"apc_list":null,"apc_paid":null,"fwci":0.1337,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.44304302,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13182","display_name":"Quantum-Dot Cellular Automata","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.7120554447174072},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7041209936141968},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.6387245655059814},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.6272120475769043},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5762506723403931},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5082561373710632},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4871327579021454},{"id":"https://openalex.org/keywords/crossbar-switch","display_name":"Crossbar switch","score":0.4809098243713379},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.47516247630119324},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.42090827226638794},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.4162341356277466},{"id":"https://openalex.org/keywords/design-flow","display_name":"Design flow","score":0.4129208028316498},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.39539724588394165},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.3941950500011444},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3789594769477844},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.31200796365737915},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.28443625569343567},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24431651830673218},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12205949425697327}],"concepts":[{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.7120554447174072},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7041209936141968},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.6387245655059814},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.6272120475769043},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5762506723403931},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5082561373710632},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4871327579021454},{"id":"https://openalex.org/C29984679","wikidata":"https://www.wikidata.org/wiki/Q1929149","display_name":"Crossbar switch","level":2,"score":0.4809098243713379},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.47516247630119324},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.42090827226638794},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.4162341356277466},{"id":"https://openalex.org/C37135326","wikidata":"https://www.wikidata.org/wiki/Q931942","display_name":"Design flow","level":2,"score":0.4129208028316498},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.39539724588394165},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.3941950500011444},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3789594769477844},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.31200796365737915},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.28443625569343567},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24431651830673218},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12205949425697327},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dac56929.2023.10247939","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/dac56929.2023.10247939","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 60th ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8700000047683716,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1972669646","https://openalex.org/W1974638538","https://openalex.org/W2072434547","https://openalex.org/W2113535733","https://openalex.org/W2242818861","https://openalex.org/W2345373798","https://openalex.org/W2896983500","https://openalex.org/W2945528538","https://openalex.org/W2952257392","https://openalex.org/W2964125333","https://openalex.org/W4313152865","https://openalex.org/W6639703010","https://openalex.org/W6690026940","https://openalex.org/W6704722796","https://openalex.org/W6784333009","https://openalex.org/W6810818354","https://openalex.org/W6991793004"],"related_works":["https://openalex.org/W2058965144","https://openalex.org/W2164382479","https://openalex.org/W98480971","https://openalex.org/W2150291671","https://openalex.org/W2027972911","https://openalex.org/W2146343568","https://openalex.org/W1569655464","https://openalex.org/W2030843684","https://openalex.org/W2115150433","https://openalex.org/W2532502681"],"abstract_inverted_index":{"With":[0],"the":[1,29,75,103],"development":[2],"of":[3,31],"AI":[4],"techniques,":[5],"it":[6],"is":[7],"appealing":[8],"but":[9],"challenging":[10],"to":[11,115],"efficiently":[12],"deploy":[13],"deep":[14,32],"neural":[15,33],"networks":[16],"on":[17,49],"resource-constrained":[18],"devices.":[19],"This":[20],"paper":[21],"presents":[22],"two":[23],"novel":[24],"algorithm-software-hardware":[25],"co-designs":[26],"for":[27,45,67],"improving":[28],"performance":[30,113],"networks.":[34],"The":[35,59,81],"first":[36],"part":[37,61],"introduces":[38,62],"a":[39,63],"hardware-efficient":[40],"adaptive":[41],"token":[42],"pruning":[43],"framework":[44],"Vision":[46],"Transformers":[47],"(ViTs)":[48],"FPGA,":[50],"which":[51,94],"achieves":[52,95],"significant":[53],"speedup":[54],"under":[55],"similar":[56],"model":[57],"accuracy.":[58],"second":[60],"design":[64],"automation":[65],"flow":[66],"crossbar-based":[68],"Binary":[69],"Neural":[70],"Network":[71],"(BNN)":[72],"accelerators":[73],"using":[74],"emerging":[76],"technique":[77],"Adiabatic":[78],"Quantum-Flux-Parametron":[79],"(AQFP).":[80],"proposed":[82,109],"method":[83],"significantly":[84],"improves":[85],"energy":[86,99],"efficiency":[87,100],"by":[88],"combining":[89],"AQFP":[90],"with":[91,102],"BNN":[92],"together,":[93],"over":[96],"100\u00d7":[97],"better":[98],"compared":[101,114],"previous":[104],"representative":[105],"AQFP-based":[106],"framework.":[107],"Both":[108],"designs":[110],"demonstrate":[111],"superior":[112],"existing":[116],"methods.":[117]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
