{"id":"https://openalex.org/W2913287340","doi":"https://doi.org/10.1109/bigdata.2018.8622178","title":"A Sketch-Based Naive Bayes Algorithms for Evolving Data Streams","display_name":"A Sketch-Based Naive Bayes Algorithms for Evolving Data Streams","publication_year":2018,"publication_date":"2018-12-01","ids":{"openalex":"https://openalex.org/W2913287340","doi":"https://doi.org/10.1109/bigdata.2018.8622178","mag":"2913287340"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2018.8622178","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2018.8622178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074483795","display_name":"Maroua Bahri","orcid":"https://orcid.org/0000-0002-7420-7464"},"institutions":[{"id":"https://openalex.org/I12356871","display_name":"T\u00e9l\u00e9com Paris","ror":"https://ror.org/01naq7912","country_code":"FR","type":"education","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Maroua Bahri","raw_affiliation_strings":["LTCI, T\u00e9l\u00e9com ParisTech, Universit\u00e9 Paris-Saclay, Paris, France","INFRES - D\u00e9partement Informatique et R\u00e9seaux (46, rue Barrault \r\n75013 Paris - France)","DIG - Data, Intelligence and Graphs (T\u00e9l\u00e9com Paris 19 Place Marguerite Perey 91120 Palaiseau - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LTCI, T\u00e9l\u00e9com ParisTech, Universit\u00e9 Paris-Saclay, Paris, France","institution_ids":["https://openalex.org/I12356871","https://openalex.org/I277688954","https://openalex.org/I4210165912"]},{"raw_affiliation_string":"INFRES - D\u00e9partement Informatique et R\u00e9seaux (46, rue Barrault \r\n75013 Paris - France)","institution_ids":[]},{"raw_affiliation_string":"DIG - Data, Intelligence and Graphs (T\u00e9l\u00e9com Paris 19 Place Marguerite Perey 91120 Palaiseau - France)","institution_ids":["https://openalex.org/I12356871"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035115589","display_name":"Silviu Maniu","orcid":"https://orcid.org/0000-0002-8623-1533"},"institutions":[{"id":"https://openalex.org/I102197404","display_name":"Universit\u00e9 Paris-Sud","ror":"https://ror.org/028rypz17","country_code":"FR","type":"education","lineage":["https://openalex.org/I102197404"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210144804","display_name":"Laboratoire de Recherche en Informatique","ror":"https://ror.org/04e3ktk27","country_code":"FR","type":"facility","lineage":["https://openalex.org/I102197404","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210144804","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Silviu Maniu","raw_affiliation_strings":["LRI, Universit\u00e9 Paris-Sud, Universit\u00e9 Paris-Saclay, Orsay, France","LaHDAK - LRI - Donn\u00e9es et Connaissances Massives et H\u00e9t\u00e9rog\u00e8nes (LRI) (Universit\u00e9 Paris-Saclay; B\u00e2t. 650 Lovelace ; 91405 Orsay Cedex - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LRI, Universit\u00e9 Paris-Sud, Universit\u00e9 Paris-Saclay, Orsay, France","institution_ids":["https://openalex.org/I277688954","https://openalex.org/I102197404","https://openalex.org/I4210144804"]},{"raw_affiliation_string":"LaHDAK - LRI - Donn\u00e9es et Connaissances Massives et H\u00e9t\u00e9rog\u00e8nes (LRI) (Universit\u00e9 Paris-Saclay; B\u00e2t. 650 Lovelace ; 91405 Orsay Cedex - France)","institution_ids":["https://openalex.org/I277688954","https://openalex.org/I4210144804"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080970505","display_name":"Albert Bifet","orcid":"https://orcid.org/0000-0002-8339-7773"},"institutions":[{"id":"https://openalex.org/I12356871","display_name":"T\u00e9l\u00e9com Paris","ror":"https://ror.org/01naq7912","country_code":"FR","type":"education","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Albert Bifet","raw_affiliation_strings":["LTCI, T\u00e9l\u00e9com ParisTech, Universit\u00e9 Paris-Saclay, Paris, France","INFRES - D\u00e9partement Informatique et R\u00e9seaux (46, rue Barrault \r\n75013 Paris - France)","DIG - Data, Intelligence and Graphs (T\u00e9l\u00e9com Paris 19 Place Marguerite Perey 91120 Palaiseau - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LTCI, T\u00e9l\u00e9com ParisTech, Universit\u00e9 Paris-Saclay, Paris, France","institution_ids":["https://openalex.org/I12356871","https://openalex.org/I277688954","https://openalex.org/I4210165912"]},{"raw_affiliation_string":"INFRES - D\u00e9partement Informatique et R\u00e9seaux (46, rue Barrault \r\n75013 Paris - France)","institution_ids":[]},{"raw_affiliation_string":"DIG - Data, Intelligence and Graphs (T\u00e9l\u00e9com Paris 19 Place Marguerite Perey 91120 Palaiseau - France)","institution_ids":["https://openalex.org/I12356871"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.0275,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.90188461,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"604","last_page":"613"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9782999753952026,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.9653000235557556,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8550773859024048},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.7248803377151489},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.6698378324508667},{"id":"https://openalex.org/keywords/concept-drift","display_name":"Concept drift","score":0.6635652780532837},{"id":"https://openalex.org/keywords/feature-hashing","display_name":"Feature hashing","score":0.6443538069725037},{"id":"https://openalex.org/keywords/data-stream","display_name":"Data stream","score":0.6002821922302246},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.5940515995025635},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.576103687286377},{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.553112804889679},{"id":"https://openalex.org/keywords/streaming-algorithm","display_name":"Streaming algorithm","score":0.551166296005249},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5237260460853577},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5185537934303284},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.5183566212654114},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48224005103111267},{"id":"https://openalex.org/keywords/streaming-data","display_name":"Streaming data","score":0.44454360008239746},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.324099600315094},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.2373611032962799},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.09713554382324219}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8550773859024048},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.7248803377151489},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.6698378324508667},{"id":"https://openalex.org/C60777511","wikidata":"https://www.wikidata.org/wiki/Q3045002","display_name":"Concept drift","level":3,"score":0.6635652780532837},{"id":"https://openalex.org/C133667856","wikidata":"https://www.wikidata.org/wiki/Q5439682","display_name":"Feature hashing","level":5,"score":0.6443538069725037},{"id":"https://openalex.org/C2778484313","wikidata":"https://www.wikidata.org/wiki/Q1172540","display_name":"Data stream","level":2,"score":0.6002821922302246},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.5940515995025635},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.576103687286377},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.553112804889679},{"id":"https://openalex.org/C187166803","wikidata":"https://www.wikidata.org/wiki/Q2835831","display_name":"Streaming algorithm","level":3,"score":0.551166296005249},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5237260460853577},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5185537934303284},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.5183566212654114},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48224005103111267},{"id":"https://openalex.org/C2777611316","wikidata":"https://www.wikidata.org/wiki/Q39045282","display_name":"Streaming data","level":2,"score":0.44454360008239746},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.324099600315094},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.2373611032962799},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.09713554382324219},{"id":"https://openalex.org/C138111711","wikidata":"https://www.wikidata.org/wiki/Q478351","display_name":"Double hashing","level":4,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata.2018.8622178","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2018.8622178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-04507533v1","is_oa":false,"landing_page_url":"https://hal.science/hal-04507533","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2018 IEEE International Conference on Big Data (Big Data), Dec 2018, Seattle, United States. pp.604-613, &#x27E8;10.1109/BigData.2018.8622178&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W139562302","https://openalex.org/W1205641087","https://openalex.org/W1525647652","https://openalex.org/W1566376227","https://openalex.org/W1603920809","https://openalex.org/W1747560487","https://openalex.org/W1817561967","https://openalex.org/W1990079212","https://openalex.org/W1998749474","https://openalex.org/W2010657328","https://openalex.org/W2016023958","https://openalex.org/W2022858489","https://openalex.org/W2068714596","https://openalex.org/W2069980026","https://openalex.org/W2070845802","https://openalex.org/W2070996757","https://openalex.org/W2080234606","https://openalex.org/W2086364952","https://openalex.org/W2099419573","https://openalex.org/W2100406636","https://openalex.org/W2113459411","https://openalex.org/W2123845384","https://openalex.org/W2127939112","https://openalex.org/W2134125037","https://openalex.org/W2135335717","https://openalex.org/W2143991132","https://openalex.org/W2272111399","https://openalex.org/W2613161123","https://openalex.org/W2621345043","https://openalex.org/W2626498001","https://openalex.org/W2747485148","https://openalex.org/W2801183640","https://openalex.org/W2971503667","https://openalex.org/W3003253354","https://openalex.org/W3126614410","https://openalex.org/W6631547688","https://openalex.org/W6636209487","https://openalex.org/W6676984168","https://openalex.org/W6679969927","https://openalex.org/W6680192438"],"related_works":["https://openalex.org/W2981673118","https://openalex.org/W2759864402","https://openalex.org/W2601363847","https://openalex.org/W3093884210","https://openalex.org/W2060628068","https://openalex.org/W3006639312","https://openalex.org/W2940903377","https://openalex.org/W2761091637","https://openalex.org/W3000948009","https://openalex.org/W2365282734"],"abstract_inverted_index":{"A":[0],"well-known":[1,94],"learning":[2,50],"task":[3],"in":[4,13,17,46,53,72,97,141],"big":[5,192],"data":[6,23,45,68,127,140,193],"stream":[7,194],"mining":[8,195],"is":[9,31,58,70,144],"classification.":[10],"Extensively":[11],"studied":[12],"the":[14,18,36,44,49,54,64,93,101,106,123,150,190],"offline":[15,37],"setting,":[16,38,56],"streaming":[19,55,126],"setting":[20],"-":[21,29],"where":[22],"are":[24],"evolving":[25,86,130],"and":[26,83,131,215],"even":[27],"infinite":[28],"it":[30],"still":[32],"a":[33,153,163,170,175,185,198],"challenge.":[34],"In":[35],"training":[39,107],"needs":[40],"to":[41,60,63,99,104,120,158,162,169,189],"store":[42,105],"all":[43],"memory":[47,172],"for":[48,155],"task;":[51],"yet,":[52],"this":[57,80],"impossible":[59],"do":[61],"due":[62],"massive":[65],"amount":[66,200],"of":[67,201],"that":[69,125,160,180],"generated":[71],"real-time.":[73],"To":[74],"cope":[75],"with":[76,122],"these":[77,205],"resource":[78],"issues,":[79],"paper":[81],"proposes":[82],"analyzes":[84],"several":[85],"naive":[87],"Bayes":[88],"classification":[89],"algorithms,":[90],"based":[91],"on":[92,212],"count-min":[95],"sketch,":[96],"order":[98],"minimize":[100],"space":[102],"needed":[103],"data.":[108],"The":[109],"proposed":[110,182],"algorithms":[111,183,196],"also":[112],"adapt":[113],"concept":[114],"drift":[115],"approaches,":[116],"such":[117,142],"as":[118],"ADWIN,":[119],"deal":[121],"fact":[124],"may":[128],"be":[129],"change":[132],"over":[133],"time.":[134],"However,":[135],"handling":[136],"sparse,":[137],"very":[138],"high-dimensional":[139],"framework":[143],"highly":[145],"challenging.":[146],"Therefore,":[147],"we":[148],"include":[149],"hashing":[151],"trick,":[152],"technique":[154],"dimensionality":[156],"reduction,":[157],"compress":[159],"down":[161],"lower":[164],"dimensional":[165],"space,":[166],"which":[167,178],"leads":[168],"large":[171],"saving.We":[173],"give":[174],"theoretical":[176,206],"analysis":[177],"demonstrates":[179],"our":[181],"provide":[184],"similar":[186],"accuracy":[187],"quality":[188],"classical":[191],"using":[197],"reasonable":[199],"resources.":[202],"We":[203],"validate":[204],"results":[207],"by":[208],"an":[209],"extensive":[210],"evaluation":[211],"both":[213],"synthetic":[214],"real-world":[216],"datasets.":[217]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
