{"id":"https://openalex.org/W4406312294","doi":"https://doi.org/10.1007/s10994-024-06712-x","title":"Fast online feature selection in streaming data","display_name":"Fast online feature selection in streaming data","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4406312294","doi":"https://doi.org/10.1007/s10994-024-06712-x"},"language":"en","primary_location":{"id":"doi:10.1007/s10994-024-06712-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06712-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06712-x.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06712-x.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5099087693","display_name":"Yael Hochma","orcid":"https://orcid.org/0009-0007-2783-9665"},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Yael Hochma","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel"],"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066910344","display_name":"Mark Last","orcid":"https://orcid.org/0000-0003-0748-7918"},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Mark Last","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel"],"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5099087693"],"corresponding_institution_ids":["https://openalex.org/I124227911"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":14.0589,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.9837149,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"114","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7665243148803711},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.673258364200592},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6693261861801147},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6450209617614746},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5725148320198059},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.5206329226493835},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5193313360214233},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.5121273994445801},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.5106392502784729},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4787539839744568},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.46817654371261597},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.4584715962409973},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.4512917995452881},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.44411033391952515},{"id":"https://openalex.org/keywords/concept-drift","display_name":"Concept drift","score":0.42877477407455444},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.4231216311454773},{"id":"https://openalex.org/keywords/streaming-data","display_name":"Streaming data","score":0.421084463596344},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.29227328300476074}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7665243148803711},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.673258364200592},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6693261861801147},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6450209617614746},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5725148320198059},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.5206329226493835},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5193313360214233},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.5121273994445801},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.5106392502784729},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4787539839744568},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.46817654371261597},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.4584715962409973},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.4512917995452881},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.44411033391952515},{"id":"https://openalex.org/C60777511","wikidata":"https://www.wikidata.org/wiki/Q3045002","display_name":"Concept drift","level":3,"score":0.42877477407455444},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.4231216311454773},{"id":"https://openalex.org/C2777611316","wikidata":"https://www.wikidata.org/wiki/Q39045282","display_name":"Streaming data","level":2,"score":0.421084463596344},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.29227328300476074},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10994-024-06712-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06712-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06712-x.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10994-024-06712-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06712-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06712-x.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320323051","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4406312294.pdf"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W121132053","https://openalex.org/W1228375242","https://openalex.org/W1968160919","https://openalex.org/W2008056655","https://openalex.org/W2018786844","https://openalex.org/W2068714596","https://openalex.org/W2128873747","https://openalex.org/W2136051823","https://openalex.org/W2148798622","https://openalex.org/W2467405173","https://openalex.org/W2520599539","https://openalex.org/W2585528949","https://openalex.org/W2608159125","https://openalex.org/W2620707422","https://openalex.org/W2786121076","https://openalex.org/W2847284300","https://openalex.org/W2886346162","https://openalex.org/W2911862380","https://openalex.org/W3010722974","https://openalex.org/W3021596612","https://openalex.org/W3036781224","https://openalex.org/W3047625343","https://openalex.org/W3080633080","https://openalex.org/W3104788453","https://openalex.org/W3105233635","https://openalex.org/W3144406059","https://openalex.org/W4233583441","https://openalex.org/W4236765470","https://openalex.org/W4283269374","https://openalex.org/W4289236186","https://openalex.org/W4313458371","https://openalex.org/W4315473677","https://openalex.org/W4315647634","https://openalex.org/W4393792513","https://openalex.org/W6675354045","https://openalex.org/W6680192438","https://openalex.org/W6681822384","https://openalex.org/W6926322744"],"related_works":["https://openalex.org/W4281572076","https://openalex.org/W2469699777","https://openalex.org/W2060628068","https://openalex.org/W3013371665","https://openalex.org/W2773951400","https://openalex.org/W4391093024","https://openalex.org/W4388036646","https://openalex.org/W3208495060","https://openalex.org/W2277307313","https://openalex.org/W1521014365"],"abstract_inverted_index":{"Abstract":[0],"The":[1],"challenge":[2],"of":[3,7,32,43,68,81,94,208,217,267],"getting":[4],"big":[5],"amounts":[6],"high-quality":[8],"labeled":[9,34],"data":[10,17,35,89,140,191,270,278],"is":[11,19],"compounded":[12],"by":[13,237],"the":[14,30,33,39,66,79,92,114,214,218,233,238,264],"fact":[15],"that":[16,196],"labeling":[18,51],"often":[20],"subjective":[21],"and":[22,41,55,72,128,144,155,173,184,201,253,274],"requires":[23,245],"significant":[24,63],"human":[25,44],"effort.":[26],"In":[27],"many":[28],"cases,":[29],"quality":[31],"depends":[36],"entirely":[37],"on":[38,123,137,257],"expertise":[40],"experience":[42],"annotators,":[45],"making":[46],"it":[47],"challenging":[48],"to":[49,161,190],"ensure":[50],"accuracy":[52,215,234],"in":[53,87,118,206,228,276],"large":[54],"dynamic":[56,277],"datasets.":[57,259],"Moreover,":[58,243],"there":[59],"may":[60,96],"be":[61],"a":[62,69,102],"delay":[64],"between":[65],"arrival":[67],"new":[70],"instance":[71],"its":[73],"manual":[74],"labeling.":[75],"This":[76],"paper":[77],"explores":[78],"use":[80],"fully":[82],"unsupervised":[83,179,202,239],"feature":[84,104,115,164,203,272],"selection":[85,105,165,204,275],"algorithms":[86,205],"non-stationary":[88],"streams,":[90,141],"where":[91],"importance":[93,116],"features":[95],"change":[97],"over":[98],"time.":[99],"We":[100,134,158],"introduce":[101],"novel":[103],"algorithm":[106],"called":[107],"Online":[108,153],"Fast":[109],"FEa-ture":[110],"SELection-OFFESEL,":[111],"which":[112,187,222],"calculates":[113],"scores":[117],"each":[119],"incoming":[120],"window":[121],"based":[122],"their":[124],"mean":[125],"normalized":[126],"values":[127],"without":[129],"using":[130,146,268],"any":[131],"class":[132],"labels.":[133],"evaluate":[135],"OFFESEL":[136,160,197,212,244],"17":[138],"benchmark":[139],"both":[142],"stationary":[143,258],"non-stationary,":[145],"popular":[147,178],"online":[148],"classifiers":[149],"like":[150,171,181],"PerceptronMask,":[151],"VFDT,":[152],"Boosting,":[154],"Linear":[156],"SVM.":[157],"compare":[159],"several":[162],"other":[163],"algorithms,":[166],"including":[167],"state-of-the-art":[168],"supervised":[169,200,219],"ones":[170,180],"FIRES":[172,220],"ABFS,":[174],"as":[175,177],"well":[176],"MCFS,":[182],"LS,":[183],"Max":[185,240,251],"Variance,":[186],"we":[188],"adapted":[189],"streams.":[192,279],"Our":[193],"results":[194],"indicate":[195],"outperforms":[198],"all":[199],"terms":[207],"classification":[209],"accuracy.":[210],"Specifically,":[211],"preserves":[213],"level":[216,235],"algorithm,":[221],"proved":[223],"more":[224],"accurate":[225],"than":[226,250],"ABFS":[227],"our":[229,261],"experiments,":[230],"while":[231],"maintaining":[232],"achieved":[236],"Variance":[241,252],"algorithm.":[242],"even":[246],"less":[247],"computation":[248],"time":[249],"shows":[254],"high":[255],"stability":[256],"Overall,":[260],"study":[262],"demonstrates":[263],"potential":[265],"benefits":[266],"unlabeled":[269],"for":[271],"ranking":[273]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
