{"id":"https://openalex.org/W4386043310","doi":"https://doi.org/10.14778/3611479.3611496","title":"Accelerating Aggregation Queries on Unstructured Streams of Data","display_name":"Accelerating Aggregation Queries on Unstructured Streams of Data","publication_year":2023,"publication_date":"2023-07-01","ids":{"openalex":"https://openalex.org/W4386043310","doi":"https://doi.org/10.14778/3611479.3611496"},"language":"en","primary_location":{"id":"doi:10.14778/3611479.3611496","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3611479.3611496","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2308.09157","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113228367","display_name":"Matthew Russo","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Matthew Russo","raw_affiliation_strings":["Stanford University"],"affiliations":[{"raw_affiliation_string":"Stanford University","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015518638","display_name":"Tatsunori Hashimoto","orcid":"https://orcid.org/0000-0003-0521-5855"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tatsunori Hashimoto","raw_affiliation_strings":["Stanford University"],"affiliations":[{"raw_affiliation_string":"Stanford University","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072348548","display_name":"Daniel Kang","orcid":"https://orcid.org/0000-0001-9860-9938"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Daniel Kang","raw_affiliation_strings":["University of Illinois Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101577180","display_name":"Yi Sun","orcid":"https://orcid.org/0000-0002-6124-4127"},"institutions":[{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yi Sun","raw_affiliation_strings":["University of Chicago"],"affiliations":[{"raw_affiliation_string":"University of Chicago","institution_ids":["https://openalex.org/I40347166"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005554337","display_name":"Matei Zaharia","orcid":"https://orcid.org/0000-0002-7547-7204"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Matei Zaharia","raw_affiliation_strings":["Stanford University"],"affiliations":[{"raw_affiliation_string":"Stanford University","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5113228367"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":0.879,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.79095513,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"16","issue":"11","first_page":"2897","last_page":"2910"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8378332257270813},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.8009864687919617},{"id":"https://openalex.org/keywords/mean-squared-error","display_name":"Mean squared error","score":0.4973445236682892},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.4959283769130707},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.4784241318702698},{"id":"https://openalex.org/keywords/inquest","display_name":"Inquest","score":0.4677804708480835},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.4461888074874878},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4326365888118744},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.11751636862754822},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.10487973690032959},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.0968087911605835}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8378332257270813},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.8009864687919617},{"id":"https://openalex.org/C139945424","wikidata":"https://www.wikidata.org/wiki/Q1940696","display_name":"Mean squared error","level":2,"score":0.4973445236682892},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.4959283769130707},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.4784241318702698},{"id":"https://openalex.org/C2780476252","wikidata":"https://www.wikidata.org/wiki/Q6036832","display_name":"Inquest","level":2,"score":0.4677804708480835},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.4461888074874878},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4326365888118744},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.11751636862754822},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.10487973690032959},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0968087911605835},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.14778/3611479.3611496","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3611479.3611496","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2308.09157","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2308.09157","pdf_url":"https://arxiv.org/pdf/2308.09157","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2308.09157","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2308.09157","pdf_url":"https://arxiv.org/pdf/2308.09157","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.8600000143051147,"id":"https://metadata.un.org/sdg/11"}],"awards":[{"id":"https://openalex.org/G1807707695","display_name":null,"funder_award_id":"51570","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G1861310076","display_name":null,"funder_award_id":"CNS-1651570","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6671297155","display_name":null,"funder_award_id":"CAREER","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320307791","display_name":"Cisco Systems","ror":"https://ror.org/03yt1ez60"},{"id":"https://openalex.org/F4320315389","display_name":"Open Philanthropy Project","ror":"https://ror.org/004d1k391"},{"id":"https://openalex.org/F4320315934","display_name":"Toyota Research Institute","ror":null},{"id":"https://openalex.org/F4320316785","display_name":"VMware","ror":null},{"id":"https://openalex.org/F4320330001","display_name":"Ant Financial Services Group","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4386043310.pdf","grobid_xml":"https://content.openalex.org/works/W4386043310.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W95608104","https://openalex.org/W1976821017","https://openalex.org/W1986319134","https://openalex.org/W2006722592","https://openalex.org/W2053154469","https://openalex.org/W2132520482","https://openalex.org/W2144200996","https://openalex.org/W2144771673","https://openalex.org/W2169593628","https://openalex.org/W2194775991","https://openalex.org/W2476844261","https://openalex.org/W2493916176","https://openalex.org/W2752236330","https://openalex.org/W2803764703","https://openalex.org/W2808184646","https://openalex.org/W2963150697","https://openalex.org/W2963341956","https://openalex.org/W2998032620","https://openalex.org/W2998752879","https://openalex.org/W3000318171","https://openalex.org/W3028942915","https://openalex.org/W3082972076","https://openalex.org/W3103442520","https://openalex.org/W3106402164","https://openalex.org/W3106772683","https://openalex.org/W3120920214","https://openalex.org/W3167312943","https://openalex.org/W3172687595","https://openalex.org/W3180149397","https://openalex.org/W3185475042","https://openalex.org/W3198567598","https://openalex.org/W4206547457","https://openalex.org/W4242954443","https://openalex.org/W4281739679","https://openalex.org/W4285190530","https://openalex.org/W4289866504","https://openalex.org/W4302338090"],"related_works":["https://openalex.org/W2097651754","https://openalex.org/W2077460601","https://openalex.org/W2163680304","https://openalex.org/W2106922085","https://openalex.org/W40054374","https://openalex.org/W2885392948","https://openalex.org/W2410666327","https://openalex.org/W2315703946","https://openalex.org/W4249308316","https://openalex.org/W2082830410"],"abstract_inverted_index":{"Analysts":[0],"and":[1,11,134,172,203,206],"scientists":[2],"are":[3],"interested":[4],"in":[5,48,166],"querying":[6,28],"streams":[7,119,185],"of":[8,54,87,96,103,120,141,151,178,245],"video,":[9],"audio,":[10],"text":[12,204],"to":[13,24,44,68,81,84,137,148,160,191,224,237],"extract":[14],"quantitative":[15],"insights.":[16],"For":[17],"example,":[18],"an":[19,142,162],"urban":[20],"planner":[21],"may":[22],"wish":[23],"measure":[25],"congestion":[26],"by":[27],"the":[29,49,61,69,85,94,139,152,157,175,192,211],"live":[30],"feed":[31],"from":[32],"a":[33,73,111,149,187,242,249],"traffic":[34],"camera.":[35],"Prior":[36],"work":[37,56,92,107],"has":[38],"used":[39],"deep":[40],"neural":[41],"networks":[42],"(DNNs)":[43],"answer":[45,165],"such":[46],"queries":[47,99,116],"batch":[50,251],"setting.":[51],"However,":[52],"much":[53],"this":[55,106],"is":[57,79],"not":[58],"suited":[59],"for":[60,113],"streaming":[62,220],"setting":[63,252],"because":[64],"it":[65],"requires":[66],"access":[67],"entire":[70],"dataset":[71],"before":[72],"query":[74,126,164,180],"can":[75,234],"be":[76],"submitted":[77],"or":[78],"specific":[80],"video.":[82],"Thus,":[83],"best":[86],"our":[88,197],"knowledge,":[89],"no":[90],"prior":[91],"addresses":[93],"problem":[95],"efficiently":[97],"answering":[98],"over":[100],"multiple":[101],"modalities":[102],"streams.":[104],"In":[105],"we":[108],"propose":[109],"InQuest,":[110],"system":[112],"accelerating":[114],"aggregation":[115],"on":[117,125,183,199],"unstructured":[118],"data":[121],"with":[122,222],"statistical":[123],"guarantees":[124],"accuracy.":[127],"InQuest":[128,171,209,233],"leverages":[129],"inexpensive":[130],"approximation":[131],"models":[132],"(\"proxies\")":[133],"sampling":[135],"techniques":[136],"limit":[138],"execution":[140],"expensive":[143],"high-precision":[144],"model":[145],"(an":[146],"\"oracle\")":[147],"subset":[150],"stream.":[153],"It":[154],"then":[155],"uses":[156],"oracle":[158,193,227,246],"predictions":[159],"compute":[161],"approximate":[163],"real-time.":[167],"We":[168,195,229],"theoretically":[169],"analyzed":[170],"show":[173,207,231],"that":[174,208,232],"expected":[176],"error":[177,216],"its":[179],"estimates":[181],"converges":[182],"stationary":[184],"at":[186,241],"rate":[188],"inversely":[189],"proportional":[190],"budget.":[194],"evaluated":[196],"algorithm":[198],"six":[200],"real-world":[201],"video":[202],"datasets":[205],"achieves":[210],"same":[212],"root":[213],"mean":[214],"squared":[215],"(RMSE)":[217],"as":[218],"two":[219],"baselines":[221],"up":[223,236],"5.0x":[225],"fewer":[226],"invocations.":[228],"further":[230],"achieve":[235],"1.9x":[238],"lower":[239],"RMSE":[240],"fixed":[243],"number":[244],"invocations":[247],"than":[248],"state-of-the-art":[250],"algorithm.":[253]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
