{"id":"https://openalex.org/W2175806766","doi":"https://doi.org/10.1109/bigdata.2015.7363736","title":"Learning to accurately COUNT with query-driven predictive analytics","display_name":"Learning to accurately COUNT with query-driven predictive analytics","publication_year":2015,"publication_date":"2015-10-01","ids":{"openalex":"https://openalex.org/W2175806766","doi":"https://doi.org/10.1109/bigdata.2015.7363736","mag":"2175806766"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2015.7363736","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2015.7363736","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001331936","display_name":"Christos Anagnostopoulos","orcid":"https://orcid.org/0000-0003-1517-6757"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Christos Anagnostopoulos","raw_affiliation_strings":["School of Computing Science, University of Glasgow, UK, G12 8QQ"],"affiliations":[{"raw_affiliation_string":"School of Computing Science, University of Glasgow, UK, G12 8QQ","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052475427","display_name":"Peter Triantafillou","orcid":"https://orcid.org/0000-0002-5807-6011"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Peter Triantafillou","raw_affiliation_strings":["School of Computing Science, University of Glasgow, UK, G12 8QQ"],"affiliations":[{"raw_affiliation_string":"School of Computing Science, University of Glasgow, UK, G12 8QQ","institution_ids":["https://openalex.org/I7882870"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5001331936"],"corresponding_institution_ids":["https://openalex.org/I7882870"],"apc_list":null,"apc_paid":null,"fwci":1.1577,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.79283212,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8603807687759399},{"id":"https://openalex.org/keywords/cardinality","display_name":"Cardinality (data modeling)","score":0.8213742971420288},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.6011651158332825},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5343811511993408},{"id":"https://openalex.org/keywords/online-aggregation","display_name":"Online aggregation","score":0.5013537406921387},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.47479361295700073},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.42549169063568115},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.33836787939071655},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.3352762460708618},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32047978043556213},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.23060151934623718}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8603807687759399},{"id":"https://openalex.org/C87117476","wikidata":"https://www.wikidata.org/wiki/Q362383","display_name":"Cardinality (data modeling)","level":2,"score":0.8213742971420288},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.6011651158332825},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5343811511993408},{"id":"https://openalex.org/C24028149","wikidata":"https://www.wikidata.org/wiki/Q7094056","display_name":"Online aggregation","level":5,"score":0.5013537406921387},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.47479361295700073},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.42549169063568115},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.33836787939071655},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.3352762460708618},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32047978043556213},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.23060151934623718},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata.2015.7363736","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2015.7363736","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.gla.ac.uk:110123","is_oa":false,"landing_page_url":"http://eprints.gla.ac.uk/view/author/30896.html>","pdf_url":null,"source":{"id":"https://openalex.org/S4210235606","display_name":"ENLIGHTEN (Jurnal Bimbingan dan Konseling Islam)","issn_l":"2622-8912","issn":["2622-8912","2622-8920"],"is_oa":false,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1581547316","https://openalex.org/W1595687138","https://openalex.org/W1679913846","https://openalex.org/W1990643970","https://openalex.org/W1994616650","https://openalex.org/W1999444602","https://openalex.org/W2018666252","https://openalex.org/W2018700273","https://openalex.org/W2022858489","https://openalex.org/W2029798546","https://openalex.org/W2045604576","https://openalex.org/W2049841622","https://openalex.org/W2078063397","https://openalex.org/W2078658761","https://openalex.org/W2089442574","https://openalex.org/W2097267430","https://openalex.org/W2098263691","https://openalex.org/W2099302642","https://openalex.org/W2113651538","https://openalex.org/W2114029045","https://openalex.org/W2120108467","https://openalex.org/W2131975293","https://openalex.org/W2144661390","https://openalex.org/W2150779766","https://openalex.org/W2151310484","https://openalex.org/W2159140866","https://openalex.org/W2162948416","https://openalex.org/W2212047990"],"related_works":["https://openalex.org/W1560919561","https://openalex.org/W2096359267","https://openalex.org/W3125756434","https://openalex.org/W2901901036","https://openalex.org/W1793997780","https://openalex.org/W2041106684","https://openalex.org/W1975198784","https://openalex.org/W2013069866","https://openalex.org/W1515687622","https://openalex.org/W2186703450"],"abstract_inverted_index":{"We":[0,69,88,115,247],"study":[1],"a":[2,71,102,117,229,249],"novel":[3],"solution":[4,17,200],"to":[5,41,49,151,244],"executing":[6],"aggregation":[7,97,136],"(and":[8],"specifically":[9],"COUNT)":[10,96],"queries":[11,65,137],"over":[12,52,202],"large-scale":[13],"data.":[14,54],"The":[15,187],"proposed":[16],"is":[18,58,101,196,219,242],"generally":[19],"applicable,":[20],"in":[21,29,31,192],"the":[22,77,91,128,139,153,156,179,183,197],"sense":[23],"that":[24,193,241],"it":[25,57,100,150,194],"can":[26,80],"be":[27,50,81],"deployed":[28],"environments":[30,204],"which":[32,205,218],"data":[33,43,108,185,224],"owners":[34],"may":[35,37],"or":[36],"not":[38],"restrict":[39],"access":[40],"their":[42,53,67,142],"and":[44,66,111,148,182,226,236,238,259,269],"allow":[45],"only":[46,198],"`aggregation":[47],"operators'":[48],"executed":[51],"For":[55],"this,":[56],"based":[59],"on":[60,90],"predictive":[61],"analytics,":[62,225],"driven":[63],"by":[64],"results.":[68],"propose":[70],"machine":[72],"learning":[73,169,212],"(ML)":[74],"framework":[75],"for":[76,83,105,112,171,214,222],"task":[78],"(which":[79],"adapted":[82],"different":[84],"aggregates":[85],"as":[86,99],"well).":[87],"focus":[89],"widely":[92],"used":[93],"set-cardinality":[94],"(i.e.,":[95],"operator,":[98],"fundamental":[103],"operator":[104],"both":[106,178],"internal":[107],"system":[109],"optimisations":[110],"aggregation-query":[113],"analytics.":[114],"contribute":[116],"novel,":[118],"query-driven":[119,199],"ML":[120,165],"model":[121,166],"whose":[122],"goals":[123],"are":[124],"to:":[125],"(i)":[126,195],"learn":[127],"query":[129,146],"space":[130],"(access":[131],"patterns),":[132],"(ii)":[133,209],"associate":[134],"(complex)":[135],"with":[138],"cardinality":[140,154],"of":[141,155,159,189,233,253],"results,":[143],"(iii)":[144,227],"define":[145],"similarity":[147],"use":[149],"predict":[152],"answer":[157],"set":[158],"an":[160],"ad-hoc":[161,216],"incoming":[162],"query.":[163],"Our":[164],"incorporates":[167],"incremental":[168,211],"algorithms":[170],"ensuring":[172],"high":[173],"prediction":[174,234],"accuracy":[175,235],"even":[176],"when":[177],"querying":[180],"patterns":[181],"underlying":[184],"change.":[186],"significance":[188],"contribution":[190],"lies":[191],"applicable":[201],"general":[203],"include":[206],"restricted-access":[207],"data,":[208],"offers":[210,228],"adjusted":[213],"arriving":[215],"queries,":[217],"well":[220],"suited":[221],"big":[223],"performance":[230,251],"(in":[231],"terms":[232],"time,":[237],"memory":[239],"requirements)":[240],"superior":[243],"data-centric":[245,264],"approaches.":[246],"provide":[248],"comprehensive":[250],"evaluation":[252],"our":[254],"model,":[255],"evaluating":[256],"its":[257],"sensitivity":[258],"comparative":[260],"advantages":[261],"versus":[262],"acclaimed":[263],"methods":[265],"(self-tuning":[266],"histograms,":[267],"sampling,":[268],"multidimensional":[270],"histograms).":[271]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":5},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
