{"id":"https://openalex.org/W4312311177","doi":"https://doi.org/10.14778/3551793.3551867","title":"Enabling efficient and general subpopulation analytics in multidimensional data streams","display_name":"Enabling efficient and general subpopulation analytics in multidimensional data streams","publication_year":2022,"publication_date":"2022-07-01","ids":{"openalex":"https://openalex.org/W4312311177","doi":"https://doi.org/10.14778/3551793.3551867"},"language":"en","primary_location":{"id":"doi:10.14778/3551793.3551867","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3551793.3551867","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013987367","display_name":"Antonis Manousis","orcid":"https://orcid.org/0009-0003-8130-4435"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Antonis Manousis","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054211420","display_name":"Cheng Zhuo","orcid":"https://orcid.org/0000-0002-2610-7522"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhuo Cheng","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000201729","display_name":"Ran Ben Basat","orcid":"https://orcid.org/0000-0003-0196-9190"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ran Ben Basat","raw_affiliation_strings":["University College London"],"affiliations":[{"raw_affiliation_string":"University College London","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015818714","display_name":"Zaoxing Liu","orcid":"https://orcid.org/0000-0002-9119-1679"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zaoxing Liu","raw_affiliation_strings":["Boston University"],"affiliations":[{"raw_affiliation_string":"Boston University","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079175103","display_name":"Vyas Sekar","orcid":"https://orcid.org/0000-0001-5452-8976"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vyas Sekar","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5013987367"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":0.828,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.78155254,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"15","issue":"11","first_page":"3249","last_page":"3262"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7990995645523071},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.7097208499908447},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.7040502429008484},{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.5762678980827332},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5676106214523315},{"id":"https://openalex.org/keywords/memory-footprint","display_name":"Memory footprint","score":0.5260838270187378},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4398183226585388},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.434467613697052},{"id":"https://openalex.org/keywords/plug-in","display_name":"Plug-in","score":0.4166010022163391},{"id":"https://openalex.org/keywords/footprint","display_name":"Footprint","score":0.41393887996673584},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3569224178791046},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1453867256641388},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11100390553474426}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7990995645523071},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.7097208499908447},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.7040502429008484},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.5762678980827332},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5676106214523315},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.5260838270187378},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4398183226585388},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.434467613697052},{"id":"https://openalex.org/C4924752","wikidata":"https://www.wikidata.org/wiki/Q184148","display_name":"Plug-in","level":2,"score":0.4166010022163391},{"id":"https://openalex.org/C132943942","wikidata":"https://www.wikidata.org/wiki/Q2562511","display_name":"Footprint","level":2,"score":0.41393887996673584},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3569224178791046},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1453867256641388},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11100390553474426},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.14778/3551793.3551867","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3551793.3551867","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},{"id":"pmh:oai:null:2144/47059","is_oa":false,"landing_page_url":"https://www.webofscience.com/api/gateway?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000992390600075&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=6e74115fe3da270499c3d65c9b17d654","pdf_url":null,"source":{"id":"https://openalex.org/S4306402384","display_name":"OpenBU (Boston University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I111088046","host_organization_name":"Boston University","host_organization_lineage":["https://openalex.org/I111088046"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":null,"raw_type":"Conference materials"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":72,"referenced_works":["https://openalex.org/W95608104","https://openalex.org/W1541742946","https://openalex.org/W1546080482","https://openalex.org/W1590183325","https://openalex.org/W1971731845","https://openalex.org/W1972848834","https://openalex.org/W1998244781","https://openalex.org/W2010250346","https://openalex.org/W2022858489","https://openalex.org/W2024463287","https://openalex.org/W2025051251","https://openalex.org/W2038412523","https://openalex.org/W2040088116","https://openalex.org/W2057714068","https://openalex.org/W2064379477","https://openalex.org/W2071989194","https://openalex.org/W2074935284","https://openalex.org/W2077578097","https://openalex.org/W2078345533","https://openalex.org/W2080133348","https://openalex.org/W2080234606","https://openalex.org/W2082171780","https://openalex.org/W2084200885","https://openalex.org/W2098935637","https://openalex.org/W2099480861","https://openalex.org/W2100830825","https://openalex.org/W2110086534","https://openalex.org/W2115503987","https://openalex.org/W2119400430","https://openalex.org/W2119738171","https://openalex.org/W2122646361","https://openalex.org/W2133910774","https://openalex.org/W2139054829","https://openalex.org/W2141742398","https://openalex.org/W2144261930","https://openalex.org/W2152029707","https://openalex.org/W2153399951","https://openalex.org/W2153972927","https://openalex.org/W2156660460","https://openalex.org/W2164507334","https://openalex.org/W2284530523","https://openalex.org/W2293308125","https://openalex.org/W2294581520","https://openalex.org/W2294895103","https://openalex.org/W2296677182","https://openalex.org/W2394680079","https://openalex.org/W2421547754","https://openalex.org/W2487095677","https://openalex.org/W2542459869","https://openalex.org/W2613577383","https://openalex.org/W2613751718","https://openalex.org/W2737988660","https://openalex.org/W2743027853","https://openalex.org/W2744538883","https://openalex.org/W2795530455","https://openalex.org/W2809244162","https://openalex.org/W2878215196","https://openalex.org/W2948371369","https://openalex.org/W2948791565","https://openalex.org/W3004286518","https://openalex.org/W3017778882","https://openalex.org/W3046351827","https://openalex.org/W3081937877","https://openalex.org/W3089269561","https://openalex.org/W3100965700","https://openalex.org/W3176348316","https://openalex.org/W4238584892","https://openalex.org/W4242587584","https://openalex.org/W4246444773","https://openalex.org/W4289258943","https://openalex.org/W4402262144","https://openalex.org/W6712120708"],"related_works":["https://openalex.org/W2378994405","https://openalex.org/W2385974820","https://openalex.org/W2373478030","https://openalex.org/W2378679551","https://openalex.org/W3149739944","https://openalex.org/W2392363776","https://openalex.org/W2063051341","https://openalex.org/W3013442081","https://openalex.org/W3137434606","https://openalex.org/W4372263373"],"abstract_inverted_index":{"Today's":[0],"large-scale":[1],"services":[2],"(":[3],"e.g.":[4],",":[5],"video":[6],"streaming":[7],"platforms,":[8],"data":[9,48],"centers,":[10],"sensor":[11],"grids)":[12],"need":[13,57],"diverse":[14],"real-time":[15],"summary":[16,54],"statistics":[17,55],"across":[18],"multiple":[19,97,118],"subpopulations":[20,49,88],"of":[21,47,53,75,79,85,137,143],"multidimensional":[22,68,122],"datasets.":[23],"However,":[24],"state-of-the-art":[25],"frameworks":[26,151],"do":[27],"not":[28],"offer":[29],"general":[30],"and":[31,50,89,107,120,133,146],"accurate":[32,94],"analytics":[33,69],"in":[34,141],"real":[35],"time":[36],"at":[37,115],"reasonable":[38],"costs.":[39],"The":[40],"root":[41],"cause":[42],"is":[43,134],"the":[44,51,83],"combinatorial":[45],"explosion":[46],"diversity":[52],"we":[56,124],"to":[58,81,92,112],"monitor":[59],"simultaneously.":[60],"We":[61,99],"present":[62],"Hydra,":[63],"an":[64,103,135],"efficient":[65,140],"framework":[66],"for":[67,96],"that":[70,126],"presents":[71],"a":[72,77],"novel":[73],"combination":[74],"using":[76],"\"sketch":[78],"sketches\"":[80],"avoid":[82],"overhead":[84],"monitoring":[86],"exponentially-many":[87],"universal":[90],"sketching":[91],"ensure":[93],"estimates":[95],"statistics.":[98],"build":[100],"Hydra":[101,127],"as":[102],"Apache":[104],"Spark":[105],"plugin":[106],"address":[108],"practical":[109],"system":[110],"challenges":[111],"minimize":[113],"overheads":[114],"scale.":[116],"Across":[117],"real-world":[119],"synthetic":[121],"datasets,":[123],"show":[125],"can":[128],"achieve":[129],"robust":[130],"error":[131],"bounds":[132],"order":[136],"magnitude":[138],"more":[139],"terms":[142],"operational":[144],"cost":[145],"memory":[147],"footprint":[148],"than":[149],"existing":[150],"(e.g.,":[152],"Spark,":[153],"Druid)":[154],"while":[155],"ensuring":[156],"interactive":[157],"estimation":[158],"times.":[159]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
