{"id":"https://openalex.org/W4392265925","doi":"https://doi.org/10.1109/cgo57630.2024.10444807","title":"Revamping Sampling-Based PGO with Context-Sensitivity and Pseudo-instrumentation","display_name":"Revamping Sampling-Based PGO with Context-Sensitivity and Pseudo-instrumentation","publication_year":2024,"publication_date":"2024-02-28","ids":{"openalex":"https://openalex.org/W4392265925","doi":"https://doi.org/10.1109/cgo57630.2024.10444807"},"language":"en","primary_location":{"id":"doi:10.1109/cgo57630.2024.10444807","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cgo57630.2024.10444807","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/ACM International Symposium on Code Generation and Optimization (CGO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111137643","display_name":"Wenlei He","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wenlei He","raw_affiliation_strings":["Meta Inc.,USA","Meta Inc., USA"],"affiliations":[{"raw_affiliation_string":"Meta Inc.,USA","institution_ids":[]},{"raw_affiliation_string":"Meta Inc., USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052620797","display_name":"Hongtao Yu","orcid":"https://orcid.org/0000-0003-1785-972X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongtao Yu","raw_affiliation_strings":["Meta Inc.,USA","Meta Inc., USA"],"affiliations":[{"raw_affiliation_string":"Meta Inc.,USA","institution_ids":[]},{"raw_affiliation_string":"Meta Inc., USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111939510","display_name":"Lei Wang","orcid":"https://orcid.org/0000-0003-3249-7333"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei Wang","raw_affiliation_strings":["Meta Inc.,USA","Meta Inc., USA"],"affiliations":[{"raw_affiliation_string":"Meta Inc.,USA","institution_ids":[]},{"raw_affiliation_string":"Meta Inc., USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5114131269","display_name":"Taewook Oh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taewook Oh","raw_affiliation_strings":["Meta Inc.,USA","Meta Inc., USA"],"affiliations":[{"raw_affiliation_string":"Meta Inc.,USA","institution_ids":[]},{"raw_affiliation_string":"Meta Inc., USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5111137643"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.4133,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.93259407,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"322","last_page":"333"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12452","display_name":"Electrowetting and Microfluidic Technologies","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/instrumentation","display_name":"Instrumentation (computer programming)","score":0.8102226853370667},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7460981607437134},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7384097576141357},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.5755264759063721},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.546999990940094},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5429579615592957},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.5162765383720398},{"id":"https://openalex.org/keywords/data-center","display_name":"Data center","score":0.4573497176170349},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.40902507305145264},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3611134886741638},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.33981460332870483},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1382116973400116},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.09738868474960327},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07194310426712036}],"concepts":[{"id":"https://openalex.org/C118530786","wikidata":"https://www.wikidata.org/wiki/Q1134732","display_name":"Instrumentation (computer programming)","level":2,"score":0.8102226853370667},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7460981607437134},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7384097576141357},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.5755264759063721},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.546999990940094},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5429579615592957},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.5162765383720398},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.4573497176170349},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.40902507305145264},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3611134886741638},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33981460332870483},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1382116973400116},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.09738868474960327},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07194310426712036},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cgo57630.2024.10444807","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cgo57630.2024.10444807","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/ACM International Symposium on Code Generation and Optimization (CGO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1968131528","https://openalex.org/W1975332288","https://openalex.org/W2001055007","https://openalex.org/W2022666100","https://openalex.org/W2031487553","https://openalex.org/W2068640305","https://openalex.org/W2157775926","https://openalex.org/W2303680680","https://openalex.org/W2607905318","https://openalex.org/W2891545657","https://openalex.org/W2952416601","https://openalex.org/W3103670547","https://openalex.org/W4205582557","https://openalex.org/W4238089251","https://openalex.org/W4241315977","https://openalex.org/W4246166885","https://openalex.org/W4247444363","https://openalex.org/W4249818463","https://openalex.org/W4252857370","https://openalex.org/W4255078887","https://openalex.org/W4255185178","https://openalex.org/W4302828500","https://openalex.org/W4318541549","https://openalex.org/W6638039902","https://openalex.org/W6696599122"],"related_works":["https://openalex.org/W562823126","https://openalex.org/W2106037662","https://openalex.org/W1530419332","https://openalex.org/W2045782830","https://openalex.org/W2143942744","https://openalex.org/W2469134140","https://openalex.org/W2165392093","https://openalex.org/W1972557159","https://openalex.org/W2993874308","https://openalex.org/W2809058302"],"abstract_inverted_index":{"The":[0,87],"ever":[1],"increasing":[2],"scale":[3],"of":[4,17,37,47,91,151,184,201],"modern":[5],"data":[6,41,186],"center":[7,187],"demands":[8],"more":[9,123,162],"effective":[10,163],"optimizations,":[11],"as":[12,81,83],"even":[13],"a":[14,23,54,113,122,166],"small":[15],"percentage":[16],"performance":[18,77,105,130,197],"improvement":[19,198],"can":[20],"result":[21],"in":[22,26,40,66],"significant":[24],"reduction":[25],"data-center":[27,67],"cost":[28],"and":[29,173],"its":[30,71,99,103],"environmental":[31],"footprint.":[32],"However,":[33],"the":[34,45,76,84,95,149],"diverse":[35],"set":[36],"workloads":[38,194],"running":[39],"centers":[42],"also":[43,155],"challenges":[44],"scalability":[46],"optimization":[48,51],"solutions.":[49],"Profile-guided":[50],"(PGO)":[52],"is":[53,63,177],"promising":[55],"technique":[56],"to":[57,70,126,132,143,160,180],"improve":[58,144],"application":[59],"performance.":[60],"Sampling-based":[61],"PGO":[62,116,129,134],"widely":[64],"used":[65,179],"applications":[68],"due":[69],"low":[72],"operational":[73,89,138],"overhead,":[74],"but":[75],"gains":[78],"are":[79],"not":[80],"substantial":[82],"instrumentation-based":[85,92,133],"counterpart.":[86],"high":[88],"overhead":[90,150],"PGO,":[93],"on":[94,199],"other":[96],"hand,":[97],"hinders":[98],"large-scale":[100],"adoption,":[101],"despite":[102],"superior":[104],"gains.":[106],"In":[107],"this":[108],"paper,":[109],"we":[110],"propose":[111],"CSSPGO,":[112],"context-sensitive":[114],"sampling-based":[115,128,203],"framework":[117],"with":[118,158,192],"pseudo-instrumentation.":[119],"CSSPGO":[120,176],"offers":[121],"balanced":[124],"solution":[125],"push":[127],"closer":[131],"while":[135],"maintaining":[136],"minimal":[137],"overhead.":[139],"It":[140,154],"leverages":[141],"pseudo-instrumentation":[142],"profile":[145,157],"quality":[146],"without":[147],"incurring":[148],"traditional":[152],"instrumentation.":[153],"enriches":[156],"context-sensitivity":[159],"aid":[161],"optimizations":[164],"through":[165],"novel":[167],"profiling":[168],"methodology":[169],"using":[170],"synchronized":[171],"LBR":[172],"stack":[174],"sampling.":[175],"now":[178],"optimize":[181],"over":[182],"75%":[183],"Meta's":[185],"CPU":[188],"cycles.":[189],"Our":[190],"evaluation":[191],"production":[193],"demonstrates":[195],"1%-5%":[196],"top":[200],"state-of-the-art":[202],"PGO.":[204]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
