{"id":"https://openalex.org/W7117431406","doi":"https://doi.org/10.1007/s41019-025-00325-7","title":"SieveJoin: Boosting Multi-way Joins by Filtering Unneeded Intermediate Results","display_name":"SieveJoin: Boosting Multi-way Joins by Filtering Unneeded Intermediate Results","publication_year":2025,"publication_date":"2025-12-28","ids":{"openalex":"https://openalex.org/W7117431406","doi":"https://doi.org/10.1007/s41019-025-00325-7"},"language":"en","primary_location":{"id":"doi:10.1007/s41019-025-00325-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41019-025-00325-7","pdf_url":null,"source":{"id":"https://openalex.org/S2486411021","display_name":"Data Science and Engineering","issn_l":"2364-1185","issn":["2364-1185","2364-1541"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1007/s41019-025-00325-7","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069897977","display_name":"R. Li","orcid":"https://orcid.org/0009-0000-6572-5924"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Renrui Li","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089142532","display_name":"Qingzhi Ma","orcid":"https://orcid.org/0000-0003-2418-090X"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingzhi Ma","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121423905","display_name":"Xiaomeng Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaomeng Shi","raw_affiliation_strings":["IBSS, Xi\u2019an Jiaotong-Liverpool University, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"IBSS, Xi\u2019an Jiaotong-Liverpool University, Suzhou, China","institution_ids":["https://openalex.org/I69356397","https://openalex.org/I69356397"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5121438987","display_name":"An Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"An Liu","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, China","institution_ids":["https://openalex.org/I3923682"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5069897977"],"corresponding_institution_ids":["https://openalex.org/I3923682"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.65662583,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11","issue":"1","first_page":"143","last_page":"154"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.6085000038146973,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.6085000038146973,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.09960000216960907,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.09480000287294388,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/joins","display_name":"Joins","score":0.9230999946594238},{"id":"https://openalex.org/keywords/bloom-filter","display_name":"Bloom filter","score":0.8199999928474426},{"id":"https://openalex.org/keywords/join","display_name":"Join (topology)","score":0.777999997138977},{"id":"https://openalex.org/keywords/tuple","display_name":"Tuple","score":0.6715999841690063},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6144999861717224},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.5539000034332275},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5004000067710876}],"concepts":[{"id":"https://openalex.org/C2778692605","wikidata":"https://www.wikidata.org/wiki/Q4041866","display_name":"Joins","level":2,"score":0.9230999946594238},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.902899980545044},{"id":"https://openalex.org/C147224247","wikidata":"https://www.wikidata.org/wiki/Q885373","display_name":"Bloom filter","level":2,"score":0.8199999928474426},{"id":"https://openalex.org/C2776124973","wikidata":"https://www.wikidata.org/wiki/Q3183033","display_name":"Join (topology)","level":2,"score":0.777999997138977},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.6715999841690063},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6144999861717224},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.5539000034332275},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5004000067710876},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.44279998540878296},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37549999356269836},{"id":"https://openalex.org/C2779172887","wikidata":"https://www.wikidata.org/wiki/Q184316","display_name":"PageRank","level":2,"score":0.36340001225471497},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.36239999532699585},{"id":"https://openalex.org/C188805328","wikidata":"https://www.wikidata.org/wiki/Q4060691","display_name":"Hash join","level":3,"score":0.3521000146865845},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.3239000141620636},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.31679999828338623},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.29280000925064087},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.271699994802475},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.2709999978542328},{"id":"https://openalex.org/C19012869","wikidata":"https://www.wikidata.org/wiki/Q578372","display_name":"Response time","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s41019-025-00325-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41019-025-00325-7","pdf_url":null,"source":{"id":"https://openalex.org/S2486411021","display_name":"Data Science and Engineering","issn_l":"2364-1185","issn":["2364-1185","2364-1541"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science and Engineering","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:47b3e90f21c246b0baa44e3181d3e0a8","is_oa":true,"landing_page_url":"https://doaj.org/article/47b3e90f21c246b0baa44e3181d3e0a8","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data Science and Engineering, Vol 11, Iss 1, Pp 143-154 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s41019-025-00325-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41019-025-00325-7","pdf_url":null,"source":{"id":"https://openalex.org/S2486411021","display_name":"Data Science and Engineering","issn_l":"2364-1185","issn":["2364-1185","2364-1541"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science and Engineering","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.639065146446228}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W1558092379","https://openalex.org/W1973898816","https://openalex.org/W1979514837","https://openalex.org/W1982177147","https://openalex.org/W1982945449","https://openalex.org/W1999954067","https://openalex.org/W2001040824","https://openalex.org/W2003627696","https://openalex.org/W2008865455","https://openalex.org/W2015362435","https://openalex.org/W2023797161","https://openalex.org/W2037859435","https://openalex.org/W2046167302","https://openalex.org/W2048531653","https://openalex.org/W2067082782","https://openalex.org/W2072627547","https://openalex.org/W2097880677","https://openalex.org/W2102163972","https://openalex.org/W2103670492","https://openalex.org/W2104615308","https://openalex.org/W2111708605","https://openalex.org/W2123845384","https://openalex.org/W2132244350","https://openalex.org/W2134483537","https://openalex.org/W2145812340","https://openalex.org/W2150760714","https://openalex.org/W2156660460","https://openalex.org/W2159886933","https://openalex.org/W2161956202","https://openalex.org/W2167276970","https://openalex.org/W2168689650","https://openalex.org/W2244876453","https://openalex.org/W2292693431","https://openalex.org/W2612777267","https://openalex.org/W2613226836","https://openalex.org/W2794997248","https://openalex.org/W2798499404","https://openalex.org/W2800160956","https://openalex.org/W2963066364","https://openalex.org/W2964277307","https://openalex.org/W2970204999","https://openalex.org/W2980615028","https://openalex.org/W2982036057","https://openalex.org/W3023647491","https://openalex.org/W3028610005","https://openalex.org/W3094660140","https://openalex.org/W3116457585","https://openalex.org/W4233762723","https://openalex.org/W4244579861","https://openalex.org/W4247618959","https://openalex.org/W4248080722"],"related_works":[],"abstract_inverted_index":{"Improving":[0],"the":[1,29,41,56,70,89,93,126,142,150,161],"performance":[2],"of":[3,72,79,108,144,152],"data":[4],"systems":[5],"for":[6,69],"join":[7,24,73,90,114,183],"operations":[8],"has":[9,18],"long":[10],"been":[11,19],"a":[12,49,66,156,167,175,180],"critical":[13],"challenge.":[14],"Recently,":[15],"substantial":[16],"attention":[17],"focused":[20],"on":[21],"optimizing":[22],"multi-way":[23,62,131],"performance,":[25],"particularly":[26],"in":[27,188],"reducing":[28],"overhead":[30],"caused":[31],"by":[32],"generating":[33],"intermediate":[34,102,146],"tuples":[35],"that":[36],"do":[37],"not":[38],"contribute":[39],"to":[40,60,84,95,111,140],"final":[42],"result.":[43],"In":[44],"this":[45],"paper,":[46],"we":[47,154],"propose":[48],"novel":[50],"algorithm":[51],"called":[52],"SieveJoin,":[53,153],"which":[54],"extends":[55],"established":[57],"Bloomjoin":[58],"approach":[59],"support":[61],"joins.":[63],"SieveJoin":[64,80,109,173],"sets":[65],"new":[67],"benchmark":[68],"efficiency":[71],"query":[74],"execution.":[75],"A":[76],"key":[77],"innovation":[78],"is":[81,110],"its":[82,186],"ability":[83],"propagate":[85],"Bloom":[86,117,136],"filters":[87,137],"along":[88],"path,":[91],"allowing":[92],"system":[94],"terminate":[96],"early":[97],"and":[98,133,166,179,192],"avoid":[99],"producing":[100],"superfluous":[101],"results.":[103],"The":[104],"primary":[105],"design":[106],"objective":[107],"efficiently":[112],"estimate":[113],"results":[115,171],"using":[116,160],"filters,":[118],"while":[119],"maintaining":[120],"minimal":[121],"memory":[122,193],"overhead.":[123],"We":[124],"analyze":[125],"bottlenecks":[127],"associated":[128],"with":[129,174],"deferred":[130],"joins":[132],"detail":[134],"how":[135],"are":[138],"utilized":[139],"suppress":[141],"creation":[143],"redundant":[145],"tuples.":[147],"To":[148],"assess":[149],"effectiveness":[151],"conduct":[155],"comprehensive":[157],"experimental":[158],"evaluation":[159],"TPC-H":[162],"benchmark,":[163],"citation":[164],"datasets,":[165],"synthetic":[168],"dataset.":[169],"Our":[170],"compare":[172],"state-of-the-art":[176],"column-store":[177],"database":[178],"worst-case":[181],"optimal":[182],"algorithm,":[184],"highlighting":[185],"advantages":[187],"both":[189],"response":[190],"time":[191],"usage.":[194]},"counts_by_year":[],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-12-28T00:00:00"}
