{"id":"https://openalex.org/W4407385483","doi":"https://doi.org/10.14778/3696435.3696436","title":"The Key to Effective UDF Optimization: Before Inlining, First Perform Outlining","display_name":"The Key to Effective UDF Optimization: Before Inlining, First Perform Outlining","publication_year":2024,"publication_date":"2024-09-01","ids":{"openalex":"https://openalex.org/W4407385483","doi":"https://doi.org/10.14778/3696435.3696436"},"language":"en","primary_location":{"id":"doi:10.14778/3696435.3696436","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3696435.3696436","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006653831","display_name":"Samuel Arch","orcid":"https://orcid.org/0000-0001-7282-1658"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Samuel Arch","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100373065","display_name":"Yuchen Liu","orcid":"https://orcid.org/0000-0003-4767-0047"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuchen Liu","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076667915","display_name":"Todd C. Mowry","orcid":"https://orcid.org/0000-0003-4076-5684"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Todd C. Mowry","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069237428","display_name":"Jignesh M. Patel","orcid":"https://orcid.org/0000-0003-3653-2538"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jignesh M. Patel","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049165312","display_name":"Andrew Pavlo","orcid":"https://orcid.org/0000-0001-6040-6991"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew Pavlo","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5006653831"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":1.8213,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.86908327,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"18","issue":"1","first_page":"1","last_page":"13"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11950","display_name":"Cardiovascular Syncope and Autonomic Disorders","score":0.8607000112533569,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11950","display_name":"Cardiovascular Syncope and Autonomic Disorders","score":0.8607000112533569,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.8141999840736389,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11217","display_name":"Cardiac Arrhythmias and Treatments","score":0.7515000104904175,"subfield":{"id":"https://openalex.org/subfields/2705","display_name":"Cardiology and Cardiovascular Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.7470279335975647},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5958302021026611},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.18465763330459595}],"concepts":[{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.7470279335975647},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5958302021026611},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.18465763330459595}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3696435.3696436","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3696435.3696436","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W173430487","https://openalex.org/W1571150310","https://openalex.org/W1969460277","https://openalex.org/W2007845800","https://openalex.org/W2008116177","https://openalex.org/W2049594497","https://openalex.org/W2057651724","https://openalex.org/W2060542629","https://openalex.org/W2127637733","https://openalex.org/W2963741525","https://openalex.org/W2970388058","https://openalex.org/W3023740622","https://openalex.org/W3029703673","https://openalex.org/W3085921543","https://openalex.org/W3135575949","https://openalex.org/W3164278511","https://openalex.org/W3173732543","https://openalex.org/W4210272490","https://openalex.org/W4246166885","https://openalex.org/W4312936523","https://openalex.org/W4386128201"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Although":[0,40],"user-defined":[1],"functions":[2],"(UDFs)":[3],"are":[4],"a":[5,22,93,100,138],"popular":[6],"way":[7],"to":[8,61,68,95],"augment":[9],"SQL's":[10],"declarative":[11],"approach":[12,66],"with":[13,36],"procedural":[14],"code,":[15],"the":[16,56,70,80,103],"mismatch":[17],"between":[18],"programming":[19],"paradigms":[20],"creates":[21],"fundamental":[23],"optimization":[24],"challenge.":[25],"UDF":[26,31,58,91,101,119],"inlining":[27,41,55,125],"automatically":[28],"removes":[29],"all":[30],"calls":[32],"by":[33,148],"replacing":[34],"them":[35],"equivalent":[37],"SQL":[38,46,135],"subqueries.":[39],"leaves":[42],"queries":[43],"entirely":[44],"in":[45,48,106],"(resulting":[47],"large":[49],"performance":[50,122],"gains),":[51],"we":[52,89],"observe":[53],"that":[54,82,118],"entire":[57],"often":[59],"leads":[60],"sub-optimal":[62],"performance.":[63],"A":[64],"better":[65],"is":[67],"analyze":[69],"UDF,":[71],"deconstruct":[72],"it":[73],"into":[74],"smaller":[75],"pieces,":[76],"and":[77,109,132,147],"inline":[78],"only":[79],"pieces":[81,98],"help":[83],"query":[84,112],"optimization.":[85],"To":[86],"achieve":[87],"this,":[88],"propose":[90],"outlining,":[92],"technique":[94],"intentionally":[96],"hide":[97],"of":[99,140],"from":[102],"optimizer,":[104],"resulting":[105],"simpler":[107],"UDFs":[108],"significantly":[110],"faster":[111],"plans.":[113],"Our":[114],"implementation":[115],"(PRISM)":[116],"demonstrates":[117],"outlining":[120],"improves":[121],"over":[123],"conventional":[124],"(on":[126],"average":[127],"1.29\u00d7":[128],"speedup":[129],"for":[130,134],"DuckDB":[131],"298.73\u00d7":[133],"Server)":[136],"through":[137],"combination":[139],"more":[141],"effective":[142],"unnesting,":[143],"improved":[144],"data":[145],"skipping,":[146],"avoiding":[149],"unnecessary":[150],"joins.":[151]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
