{"id":"https://openalex.org/W2992496917","doi":"https://doi.org/10.14778/3368289.3368292","title":"Pushing data-induced predicates through joins in big-data clusters","display_name":"Pushing data-induced predicates through joins in big-data clusters","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W2992496917","doi":"https://doi.org/10.14778/3368289.3368292","mag":"2992496917"},"language":"en","primary_location":{"id":"doi:10.14778/3368289.3368292","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3368289.3368292","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023881736","display_name":"Srikanth Kandula","orcid":"https://orcid.org/0000-0001-9494-6435"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Srikanth Kandula","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054285881","display_name":"Laurel Orr","orcid":"https://orcid.org/0000-0002-2183-3541"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Laurel Orr","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038037154","display_name":"Surajit Chaudhuri","orcid":"https://orcid.org/0000-0001-8252-5270"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Surajit Chaudhuri","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5023881736"],"corresponding_institution_ids":["https://openalex.org/I4210164937"],"apc_list":null,"apc_paid":null,"fwci":2.4757,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.90385453,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"13","issue":"3","first_page":"252","last_page":"265"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/joins","display_name":"Joins","score":0.7679486274719238},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7199432849884033},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.5827779173851013},{"id":"https://openalex.org/keywords/predicate","display_name":"Predicate (mathematical logic)","score":0.49040675163269043},{"id":"https://openalex.org/keywords/statistic","display_name":"Statistic","score":0.4268028438091278},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.4168703854084015},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3714590072631836},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18442687392234802},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.17457649111747742},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.16528525948524475}],"concepts":[{"id":"https://openalex.org/C2778692605","wikidata":"https://www.wikidata.org/wiki/Q4041866","display_name":"Joins","level":2,"score":0.7679486274719238},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7199432849884033},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.5827779173851013},{"id":"https://openalex.org/C140146324","wikidata":"https://www.wikidata.org/wiki/Q1144319","display_name":"Predicate (mathematical logic)","level":2,"score":0.49040675163269043},{"id":"https://openalex.org/C89128539","wikidata":"https://www.wikidata.org/wiki/Q1949963","display_name":"Statistic","level":2,"score":0.4268028438091278},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4168703854084015},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3714590072631836},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18442687392234802},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.17457649111747742},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.16528525948524475}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3368289.3368292","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3368289.3368292","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1576035775","https://openalex.org/W1971885140","https://openalex.org/W1972115340","https://openalex.org/W1973898816","https://openalex.org/W1981988185","https://openalex.org/W1985419898","https://openalex.org/W1993433750","https://openalex.org/W1999883293","https://openalex.org/W2006296837","https://openalex.org/W2022858489","https://openalex.org/W2026354416","https://openalex.org/W2071989194","https://openalex.org/W2073824505","https://openalex.org/W2079112936","https://openalex.org/W2080745194","https://openalex.org/W2087796842","https://openalex.org/W2098935637","https://openalex.org/W2102489964","https://openalex.org/W2110086534","https://openalex.org/W2111687586","https://openalex.org/W2119400430","https://openalex.org/W2120340025","https://openalex.org/W2122406210","https://openalex.org/W2146709231","https://openalex.org/W2151251992","https://openalex.org/W2170515491","https://openalex.org/W2243512312","https://openalex.org/W2252022677","https://openalex.org/W2294895103","https://openalex.org/W2396309311","https://openalex.org/W2548945327","https://openalex.org/W2567161013","https://openalex.org/W2583754181","https://openalex.org/W2612705754","https://openalex.org/W2615139629","https://openalex.org/W2756982556","https://openalex.org/W2798926543","https://openalex.org/W4255671299"],"related_works":["https://openalex.org/W2088925915","https://openalex.org/W2382891957","https://openalex.org/W2393491644","https://openalex.org/W2067184662","https://openalex.org/W3047837489","https://openalex.org/W2378924333","https://openalex.org/W2362446711","https://openalex.org/W1495801388","https://openalex.org/W2551308855","https://openalex.org/W1760549314"],"abstract_inverted_index":{"Using":[0,116],"data":[1,10,48,85,93,113],"statistics,":[2],"we":[3],"convert":[4],"predicates":[5,12],"on":[6,16],"a":[7,117,147],"table":[8],"into":[9],"induced":[11],"(diPs)":[13],"that":[14,40,98],"apply":[15,35,70],"the":[17,28,38,78,84,92,124,127,139,143],"joining":[18],"tables.":[19],"Doing":[20],"so":[21],"substantially":[22],"speeds":[23],"up":[24],"multi-relation":[25],"queries":[26,125],"because":[27],"benefits":[29],"of":[30,80,123,138],"predicate":[31],"pushdown":[32],"can":[33,133],"now":[34],"beyond":[36],"just":[37],"tables":[39],"have":[41,60],"predicates.":[42],"We":[43,66],"use":[44],"diPs":[45,54,71,81,90,100],"to":[46,56,69,88,111],"skip":[47,134],"exclusively":[49],"during":[50,63],"query":[51,64,74,140,145],"optimization;":[52],"i.e.,":[53],"lead":[55],"better":[57],"plans":[58],"and":[59,76,91,130],"no":[61],"overhead":[62],"execution.":[65],"study":[67],"how":[68,77],"for":[72],"complex":[73],"expressions":[75],"usefulness":[79],"varies":[82],"with":[83],"statistics":[86],"used":[87],"construct":[89],"distributions.":[94],"Our":[95],"results":[96],"show":[97],"building":[99],"using":[101],"zone-maps":[102],"which":[103],"are":[104],"already":[105],"maintained":[106],"in":[107,126,146],"today's":[108],"clusters":[109],"leads":[110],"sizable":[112],"skipping":[114],"gains.":[115],"new":[118],"(slightly":[119],"larger)":[120],"statistic,":[121],"50%":[122],"TPC-H,":[128],"TPC-DS":[129],"JoinOrder":[131],"benchmarks":[132],"at":[135],"least":[136],"33%":[137],"input.":[141],"Consequently,":[142],"median":[144],"production":[148],"big-data":[149],"cluster":[150],"finishes":[151],"roughly":[152],"2x":[153],"faster.":[154]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
