{"id":"https://openalex.org/W4403278202","doi":"https://doi.org/10.1109/tcad.2024.3476450","title":"BAQE: Backend-Adaptive DNN Deployment via Synchronous Bayesian Quantization and Hardware Configuration Exploration","display_name":"BAQE: Backend-Adaptive DNN Deployment via Synchronous Bayesian Quantization and Hardware Configuration Exploration","publication_year":2024,"publication_date":"2024-10-09","ids":{"openalex":"https://openalex.org/W4403278202","doi":"https://doi.org/10.1109/tcad.2024.3476450"},"language":"en","primary_location":{"id":"doi:10.1109/tcad.2024.3476450","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2024.3476450","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013503446","display_name":"Wenqian Zhao","orcid":"https://orcid.org/0000-0001-9501-9254"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Wenqian Zhao","raw_affiliation_strings":["Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong"],"raw_orcid":"https://orcid.org/0000-0001-9501-9254","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101319284","display_name":"Shuo Yin","orcid":"https://orcid.org/0000-0003-4927-0194"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Shuo Yin","raw_affiliation_strings":["Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100662676","display_name":"Chen Bai","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Chen Bai","raw_affiliation_strings":["Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong"],"raw_orcid":"https://orcid.org/0000-0002-1742-0090","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032567340","display_name":"Zixiao Wang","orcid":"https://orcid.org/0009-0000-8179-0996"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zixiao Wang","raw_affiliation_strings":["Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong"],"raw_orcid":"https://orcid.org/0009-0000-8179-0996","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051340429","display_name":"Bei Yu","orcid":"https://orcid.org/0000-0001-6406-4810"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Bei Yu","raw_affiliation_strings":["Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong"],"raw_orcid":"https://orcid.org/0000-0001-6406-4810","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"NT, The Chinese University of Hong Kong, Department of Computer Science and Engineering, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5013503446"],"corresponding_institution_ids":["https://openalex.org/I177725633"],"apc_list":null,"apc_paid":null,"fwci":0.2353,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.56705882,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"44","issue":"4","first_page":"1394","last_page":"1405"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.7964788675308228},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.6313921213150024},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6278371214866638},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.4794953465461731},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.4369380474090576},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3603639602661133},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28810787200927734},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.20292463898658752},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11292189359664917}],"concepts":[{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.7964788675308228},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.6313921213150024},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6278371214866638},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.4794953465461731},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.4369380474090576},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3603639602661133},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28810787200927734},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.20292463898658752},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11292189359664917}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcad.2024.3476450","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcad.2024.3476450","pdf_url":null,"source":{"id":"https://openalex.org/S100835903","display_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","issn_l":"0278-0070","issn":["0278-0070","1937-4151"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2183341477","https://openalex.org/W2300242332","https://openalex.org/W2886851211","https://openalex.org/W2963122961","https://openalex.org/W2963273111","https://openalex.org/W2982041622","https://openalex.org/W2982479999","https://openalex.org/W3034719990","https://openalex.org/W3035332806","https://openalex.org/W3091795552","https://openalex.org/W3097304224","https://openalex.org/W3110519017","https://openalex.org/W3132597740","https://openalex.org/W3173648655","https://openalex.org/W3183734708","https://openalex.org/W4319459088","https://openalex.org/W4320067919","https://openalex.org/W4386108430","https://openalex.org/W4386858078","https://openalex.org/W4389523770","https://openalex.org/W6677658955","https://openalex.org/W6684191040","https://openalex.org/W6734062232","https://openalex.org/W6748224102","https://openalex.org/W6751349269","https://openalex.org/W6752057402","https://openalex.org/W6756979132","https://openalex.org/W6776767859","https://openalex.org/W6779728309","https://openalex.org/W6786271619","https://openalex.org/W6789240164"],"related_works":["https://openalex.org/W2770234245","https://openalex.org/W96612179","https://openalex.org/W4229499248","https://openalex.org/W2566006169","https://openalex.org/W1567818861","https://openalex.org/W2987774938","https://openalex.org/W4256492088","https://openalex.org/W632915154","https://openalex.org/W2055733372","https://openalex.org/W3022067003"],"abstract_inverted_index":{"Efficiently":[0],"deploying":[1],"deep":[2,101],"learning":[3,103],"(DL)":[4],"algorithms":[5],"on":[6,19,91,149],"different":[7,118],"hardware":[8,20,119,136],"backends":[9,116],"has":[10],"become":[11],"a":[12,46,61,87,97,169],"time-consuming":[13,83],"challenge.":[14],"Achieving":[15],"ultimate":[16],"inference":[17,164],"efficiency":[18],"requires":[21],"both":[22,69,162],"algorithm-level":[23,55],"model":[24,29,71,99],"compression":[25],"techniques,":[26],"such":[27,34],"as":[28,35,104],"quantization,":[30],"and":[31,38,56,74,82,122,143,166],"hardware-level":[32],"optimization,":[33],"operation":[36],"reconfiguration":[37],"scheduling.":[39],"In":[40],"this":[41,80],"article,":[42],"we":[43,65,85],"propose":[44,86],"BAQE,":[45],"unified":[47],"deployment":[48],"framework":[49],"that":[50,139,158],"bridges":[51],"the":[52,70,105,128,134,150],"gap":[53],"between":[54],"backend-level":[57],"optimization.":[58],"By":[59],"constructing":[60],"global":[62],"search":[63],"space,":[64],"can":[66,111],"synchronously":[67],"optimize":[68],"quantization":[72],"settings":[73],"backend":[75],"configuration":[76],"parameters.":[77],"To":[78],"accelerate":[79],"laborious":[81],"process,":[84],"searching":[88],"strategy":[89],"based":[90],"multiobjective":[92],"Bayesian":[93],"optimization":[94,129,171],"(BO)":[95],"using":[96],"Gaussian":[98],"with":[100,117,168],"kernel":[102],"surrogate":[106],"model.":[107],"More":[108],"importantly,":[109],"BAQE":[110],"easily":[112],"adapt":[113],"to":[114],"various":[115],"resources":[120],"efficiently":[121],"effectively.":[123],"Each":[124],"inner":[125],"step":[126],"of":[127,133],"process":[130],"is":[131],"aware":[132],"genuine":[135],"resources,":[137],"ensuring":[138],"all":[140],"accuracy/latency":[141],"metrics":[142],"historical":[144],"knowledge/feedback":[145],"are":[146],"evaluated":[147],"directly":[148],"device":[151],"within":[152],"each":[153],"iteration.":[154],"Empirical":[155],"results":[156],"demonstrate":[157],"our":[159],"approach":[160],"achieves":[161],"superior":[163],"time":[165],"accuracy":[167],"faster":[170],"process.":[172]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
