{"id":"https://openalex.org/W4416790793","doi":"https://doi.org/10.48550/arxiv.2511.21465","title":"Ensemble Performance Through the Lens of Linear Independence of Classifier Votes in Data Streams","display_name":"Ensemble Performance Through the Lens of Linear Independence of Classifier Votes in Data Streams","publication_year":2025,"publication_date":"2025-11-26","ids":{"openalex":"https://openalex.org/W4416790793","doi":"https://doi.org/10.48550/arxiv.2511.21465"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2511.21465","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.21465","pdf_url":"https://arxiv.org/pdf/2511.21465","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2511.21465","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092715591","display_name":"Enes Bektas","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bektas, Enes","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5086385685","display_name":"Fazl\u0131 Can","orcid":"https://orcid.org/0000-0003-0016-4278"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Can, Fazli","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5092715591"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9800999760627747,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9800999760627747,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.004699999932199717,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.002199999988079071,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.645799994468689},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.6226999759674072},{"id":"https://openalex.org/keywords/majority-rule","display_name":"Majority rule","score":0.5001999735832214},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.491100013256073},{"id":"https://openalex.org/keywords/independence","display_name":"Independence (probability theory)","score":0.45980000495910645},{"id":"https://openalex.org/keywords/random-subspace-method","display_name":"Random subspace method","score":0.4596000015735626},{"id":"https://openalex.org/keywords/cascading-classifiers","display_name":"Cascading classifiers","score":0.4499000012874603},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.414900004863739}],"concepts":[{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.645799994468689},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.6226999759674072},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5932999849319458},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5034999847412109},{"id":"https://openalex.org/C153668964","wikidata":"https://www.wikidata.org/wiki/Q27636","display_name":"Majority rule","level":2,"score":0.5001999735832214},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.491100013256073},{"id":"https://openalex.org/C35651441","wikidata":"https://www.wikidata.org/wiki/Q625303","display_name":"Independence (probability theory)","level":2,"score":0.45980000495910645},{"id":"https://openalex.org/C106135958","wikidata":"https://www.wikidata.org/wiki/Q7291993","display_name":"Random subspace method","level":3,"score":0.4596000015735626},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.453000009059906},{"id":"https://openalex.org/C40651066","wikidata":"https://www.wikidata.org/wiki/Q5048220","display_name":"Cascading classifiers","level":4,"score":0.4499000012874603},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.414900004863739},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37959998846054077},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37540000677108765},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3693000078201294},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.3564000129699707},{"id":"https://openalex.org/C139532973","wikidata":"https://www.wikidata.org/wiki/Q2679259","display_name":"Linear classifier","level":3,"score":0.34529998898506165},{"id":"https://openalex.org/C70136482","wikidata":"https://www.wikidata.org/wiki/Q13583781","display_name":"A-weighting","level":3,"score":0.34450000524520874},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3059000074863434},{"id":"https://openalex.org/C43091099","wikidata":"https://www.wikidata.org/wiki/Q1067788","display_name":"Through-the-lens metering","level":3,"score":0.3043999969959259},{"id":"https://openalex.org/C119898033","wikidata":"https://www.wikidata.org/wiki/Q3433888","display_name":"Ensemble forecasting","level":2,"score":0.2782999873161316},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C41045048","wikidata":"https://www.wikidata.org/wiki/Q202843","display_name":"Linear programming","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.25870001316070557},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.25519999861717224}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2511.21465","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.21465","pdf_url":"https://arxiv.org/pdf/2511.21465","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2511.21465","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.21465","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2511.21465","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.21465","pdf_url":"https://arxiv.org/pdf/2511.21465","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4416790793.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Ensemble":[0],"learning":[1],"improves":[2],"classification":[3],"performance":[4,39,159],"by":[5],"combining":[6],"multiple":[7],"base":[8],"classifiers.":[9],"While":[10],"increasing":[11],"the":[12,33,41,72,78,85,101,116,156],"number":[13],"of":[14,43,57,74,87,115,125,158],"classifiers":[15,60],"generally":[16],"enhances":[17],"accuracy,":[18],"excessively":[19],"large":[20],"ensembles":[21,55,163],"can":[22,180],"lead":[23],"to":[24,77,111,120,189],"computational":[25],"inefficiency":[26],"and":[27,38,106,137,145,192],"diminishing":[28],"returns.":[29],"This":[30],"paper":[31],"investigates":[32],"relationship":[34],"between":[35,103],"ensemble":[36,104,117,142],"size":[37,105,118],"through":[40,132],"lens":[42],"linear":[44,75,89,126],"independence":[45,76,90],"among":[46,91],"classifier":[47,92],"votes":[48],"in":[49],"data":[50],"streams.":[51],"We":[52,69,128],"propose":[53],"that":[54,99,150,176],"composed":[56],"linearly":[58],"independent":[59],"maximize":[61],"representational":[62],"capacity,":[63],"particularly":[64],"under":[65],"a":[66,96,112,122],"geometric":[67],"model.":[68],"then":[70],"generalize":[71],"importance":[73],"weighted":[79],"majority":[80],"voting":[81],"problem.":[82],"By":[83],"modeling":[84],"probability":[86,124],"achieving":[88],"outputs,":[93],"we":[94],"derive":[95],"theoretical":[97,113,152,178],"framework":[98,174],"explains":[100],"trade-off":[102],"accuracy.":[107],"Our":[108,147,184],"analysis":[109],"leads":[110],"estimate":[114,153],"required":[119],"achieve":[121],"user-specified":[123],"independence.":[127],"validate":[129],"our":[130,173],"theory":[131],"experiments":[133],"on":[134],"both":[135],"real-world":[136],"synthetic":[138],"datasets":[139],"using":[140],"two":[141],"methods,":[143],"OzaBagging":[144],"GOOWE.":[146],"results":[148],"confirm":[149],"this":[151],"effectively":[154],"identifies":[155],"point":[157],"saturation":[160],"for":[161,167],"robust":[162],"like":[164,171],"OzaBagging.":[165],"Conversely,":[166],"complex":[168],"weighting":[169],"schemes":[170],"GOOWE,":[172],"reveals":[175],"high":[177],"diversity":[179],"trigger":[181],"algorithmic":[182],"instability.":[183],"implementation":[185],"is":[186],"publicly":[187],"available":[188],"support":[190],"reproducibility":[191],"future":[193],"research.":[194]},"counts_by_year":[],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2025-11-28T00:00:00"}
