{"id":"https://openalex.org/W4416429482","doi":"https://doi.org/10.1109/iccad66269.2025.11240837","title":"GPU Acceleration for Versatile Buffer Insertion","display_name":"GPU Acceleration for Versatile Buffer Insertion","publication_year":2025,"publication_date":"2025-10-26","ids":{"openalex":"https://openalex.org/W4416429482","doi":"https://doi.org/10.1109/iccad66269.2025.11240837"},"language":null,"primary_location":{"id":"doi:10.1109/iccad66269.2025.11240837","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccad66269.2025.11240837","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM International Conference On Computer Aided Design (ICCAD)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101848345","display_name":"Yuan Pu","orcid":"https://orcid.org/0000-0002-1322-5642"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuan Pu","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109741306","display_name":"Yuhao Ji","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhao Ji","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112579216","display_name":"S.S. Yu","orcid":"https://orcid.org/0000-0003-1695-3925"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siying Yu","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045601421","display_name":"Zuodong Zhang","orcid":"https://orcid.org/0000-0002-8496-6114"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zuodong Zhang","raw_affiliation_strings":["Peking University"],"affiliations":[{"raw_affiliation_string":"Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039573083","display_name":"Zizheng Guo","orcid":"https://orcid.org/0000-0002-0724-5356"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zizheng Guo","raw_affiliation_strings":["Peking University"],"affiliations":[{"raw_affiliation_string":"Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039671544","display_name":"Zhuolun He","orcid":"https://orcid.org/0009-0009-4909-6588"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuolun He","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000933188","display_name":"Yibo Lin","orcid":"https://orcid.org/0000-0002-0977-2774"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yibo Lin","raw_affiliation_strings":["Peking University"],"affiliations":[{"raw_affiliation_string":"Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011883763","display_name":"David Z. Pan","orcid":"https://orcid.org/0000-0002-5705-2501"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Pan","raw_affiliation_strings":["University of Texas at Austin"],"affiliations":[{"raw_affiliation_string":"University of Texas at Austin","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051340429","display_name":"Bei Yu","orcid":"https://orcid.org/0000-0001-6406-4810"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bei Yu","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5101848345"],"corresponding_institution_ids":["https://openalex.org/I177725633"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.40922129,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.4108999967575073,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.4108999967575073,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10363","display_name":"Low-power high-performance VLSI design","score":0.2587999999523163,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.22120000422000885,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.651199996471405},{"id":"https://openalex.org/keywords/buffer","display_name":"Buffer (optical fiber)","score":0.5364999771118164},{"id":"https://openalex.org/keywords/capacitance","display_name":"Capacitance","score":0.5333999991416931},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.525600016117096},{"id":"https://openalex.org/keywords/place-and-route","display_name":"Place and route","score":0.451200008392334},{"id":"https://openalex.org/keywords/execution-time","display_name":"Execution time","score":0.391400009393692},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.3431999981403351},{"id":"https://openalex.org/keywords/algorithm-design","display_name":"Algorithm design","score":0.3314000070095062}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7910000085830688},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.651199996471405},{"id":"https://openalex.org/C145018004","wikidata":"https://www.wikidata.org/wiki/Q4985944","display_name":"Buffer (optical fiber)","level":2,"score":0.5364999771118164},{"id":"https://openalex.org/C30066665","wikidata":"https://www.wikidata.org/wiki/Q164399","display_name":"Capacitance","level":3,"score":0.5333999991416931},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5271999835968018},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.525600016117096},{"id":"https://openalex.org/C127879752","wikidata":"https://www.wikidata.org/wiki/Q3390760","display_name":"Place and route","level":3,"score":0.451200008392334},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.391400009393692},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3707999885082245},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.3431999981403351},{"id":"https://openalex.org/C106516650","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm design","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.28049999475479126},{"id":"https://openalex.org/C14580979","wikidata":"https://www.wikidata.org/wiki/Q876049","display_name":"Very-large-scale integration","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C64260653","wikidata":"https://www.wikidata.org/wiki/Q1194864","display_name":"Electronic design automation","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C2777418626","wikidata":"https://www.wikidata.org/wiki/Q2584887","display_name":"Electrical capacitance tomography","level":4,"score":0.26820001006126404},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.25609999895095825},{"id":"https://openalex.org/C3017489831","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Running time","level":2,"score":0.2540000081062317},{"id":"https://openalex.org/C530198007","wikidata":"https://www.wikidata.org/wiki/Q80831","display_name":"Integrated circuit","level":2,"score":0.250900000333786},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccad66269.2025.11240837","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccad66269.2025.11240837","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM International Conference On Computer Aided Design (ICCAD)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1966211539","https://openalex.org/W1976809982","https://openalex.org/W2094517495","https://openalex.org/W2100015970","https://openalex.org/W2101987243","https://openalex.org/W2118412523","https://openalex.org/W2123316553","https://openalex.org/W2125831674","https://openalex.org/W2127434816","https://openalex.org/W2133171792","https://openalex.org/W2136176071","https://openalex.org/W2160252016","https://openalex.org/W2165120956","https://openalex.org/W2296726406","https://openalex.org/W2945592068","https://openalex.org/W3027968530","https://openalex.org/W4231702789","https://openalex.org/W4235073116","https://openalex.org/W4235722324","https://openalex.org/W4236913175","https://openalex.org/W4244294857","https://openalex.org/W4249030878","https://openalex.org/W4252483151","https://openalex.org/W4256482602","https://openalex.org/W4381415966"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,21,28,107,128,151,182],"advancement":[2],"of":[3,66,89,110,132,153,158],"circuit":[4],"design":[5,23],"complexity":[6],"and":[7,26,49,84,100,174],"technology":[8],"nodes,":[9],"buffer":[10,44],"insertion":[11],"has":[12],"become":[13],"pivotal":[14],"in":[15,102],"mitigating":[16],"timing":[17,67],"violations,":[18,83,95],"significantly":[19],"impacting":[20],"physical":[22],"development":[24],"cycle":[25],"highlighting":[27],"necessity":[29],"for":[30,43,62,79,93],"acceleration":[31],"methodologies.":[32],"In":[33,69],"this":[34],"paper,":[35],"we":[36,71],"present":[37],"BIGX,":[38],"a":[39,74,86,116,176],"GPU-accelerated":[40],"algorithmic":[41],"framework":[42],"insertion.":[45],"BIGX":[46,114,155,165,180],"is":[47],"versatile":[48],"can":[50],"be":[51],"adapted":[52],"to":[53,105,135,163,193],"implement":[54],"different":[55],"dynamic":[56],"programming":[57],"(DP)":[58],"based":[59,121],"buffering":[60,77,112],"algorithms":[61,97],"repairing":[63,80],"various":[64],"types":[65],"violations.":[68,161],"particular,":[70],"introduce":[72],"MCDP,":[73,154],"dedicated":[75],"DP-based":[76,111],"algorithm":[78,92,120,185],"maximum":[81,159,171],"capacitance":[82,160,172],"propose":[85],"parallel":[87],"version":[88],"Van":[90,183],"Ginneken\u2019s":[91,184],"setup":[94],"both":[96],"are":[98],"incorporated":[99],"implemented":[101],"BIGX.":[103],"Furthermore,":[104],"overcome":[106],"runtime":[108],"limitations":[109],"algorithms,":[113],"adopts":[115],"distributed":[117],"Branch":[118],"Merge":[119],"on":[122,145],"bucket":[123],"sorting,":[124],"which":[125],"fully":[126],"leverages":[127],"hierarchical":[129],"memory":[130],"architecture":[131],"modern":[133],"GPUs":[134],"achieve":[136],"substantial":[137],"speedups":[138],"while":[139,188],"preserving":[140],"solution":[141,191],"quality.":[142],"Experimental":[143],"results":[144],"industrial":[146],"benchmarks":[147],"demonstrate":[148],"that,":[149],"with":[150,166],"integration":[152],"repairs":[156,168],"96.6%":[157],"Compared":[162],"OpenROAD,":[164],"MCDP":[167],"2.54x":[169],"more":[170],"violations":[173],"delivers":[175],"3.37x":[177],"speedup.":[178],"Additionally,":[179],"accelerates":[181],"by":[186],"11.68x":[187],"maintaining":[189],"comparable":[190],"quality":[192],"its":[194],"CPU-based":[195],"counterpart.":[196]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-20T00:00:00"}
