{"id":"https://openalex.org/W1584368464","doi":"https://doi.org/10.1109/cybconf.2015.7175952","title":"Combining nearest neighbour classifiers based on small subsamples for big data analytics","display_name":"Combining nearest neighbour classifiers based on small subsamples for big data analytics","publication_year":2015,"publication_date":"2015-06-01","ids":{"openalex":"https://openalex.org/W1584368464","doi":"https://doi.org/10.1109/cybconf.2015.7175952","mag":"1584368464"},"language":"en","primary_location":{"id":"doi:10.1109/cybconf.2015.7175952","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cybconf.2015.7175952","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE 2nd International Conference on Cybernetics (CYBCONF)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054879396","display_name":"Bartosz Krawczyk","orcid":"https://orcid.org/0000-0002-9774-0106"},"institutions":[{"id":"https://openalex.org/I11923345","display_name":"Wroc\u0142aw University of Science and Technology","ror":"https://ror.org/008fyn775","country_code":"PL","type":"education","lineage":["https://openalex.org/I11923345"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Bartosz Krawczyk","raw_affiliation_strings":["Department of Systems and Computer Networks, Wroclaw University of Technology, Wroclaw, Poland","Dept. of Systems and Computer Networks, Wroc\u0142aw University of Technology, Poland"],"affiliations":[{"raw_affiliation_string":"Department of Systems and Computer Networks, Wroclaw University of Technology, Wroclaw, Poland","institution_ids":["https://openalex.org/I11923345"]},{"raw_affiliation_string":"Dept. of Systems and Computer Networks, Wroc\u0142aw University of Technology, Poland","institution_ids":["https://openalex.org/I11923345"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060936121","display_name":"Micha\u0142 Wo\u017aniak","orcid":"https://orcid.org/0000-0003-0146-4205"},"institutions":[{"id":"https://openalex.org/I11923345","display_name":"Wroc\u0142aw University of Science and Technology","ror":"https://ror.org/008fyn775","country_code":"PL","type":"education","lineage":["https://openalex.org/I11923345"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Michal Wozniak","raw_affiliation_strings":["Department of Systems and Computer Networks, Wroclaw University of Technology, Wroclaw, Poland","Dept. of Systems and Computer Networks, Wroc\u0142aw University of Technology, Poland"],"affiliations":[{"raw_affiliation_string":"Department of Systems and Computer Networks, Wroclaw University of Technology, Wroclaw, Poland","institution_ids":["https://openalex.org/I11923345"]},{"raw_affiliation_string":"Dept. of Systems and Computer Networks, Wroc\u0142aw University of Technology, Poland","institution_ids":["https://openalex.org/I11923345"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5054879396"],"corresponding_institution_ids":["https://openalex.org/I11923345"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02187256,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"2","issue":null,"first_page":"311","last_page":"316"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7678243517875671},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.6708582639694214},{"id":"https://openalex.org/keywords/nearest-neighbour","display_name":"Nearest neighbour","score":0.6404610276222229},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6235239505767822},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5894251465797424},{"id":"https://openalex.org/keywords/k-nearest-neighbors-algorithm","display_name":"k-nearest neighbors algorithm","score":0.5485341548919678},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5453909039497375},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5115752816200256},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.4945950210094452},{"id":"https://openalex.org/keywords/random-subspace-method","display_name":"Random subspace method","score":0.49257737398147583},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.4925578236579895},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4760332405567169},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4522843062877655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7678243517875671},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.6708582639694214},{"id":"https://openalex.org/C2983946233","wikidata":"https://www.wikidata.org/wiki/Q4088109","display_name":"Nearest neighbour","level":2,"score":0.6404610276222229},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6235239505767822},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5894251465797424},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.5485341548919678},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5453909039497375},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5115752816200256},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.4945950210094452},{"id":"https://openalex.org/C106135958","wikidata":"https://www.wikidata.org/wiki/Q7291993","display_name":"Random subspace method","level":3,"score":0.49257737398147583},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.4925578236579895},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4760332405567169},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4522843062877655},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cybconf.2015.7175952","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cybconf.2015.7175952","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE 2nd International Conference on Cybernetics (CYBCONF)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1505837402","https://openalex.org/W1947256441","https://openalex.org/W1985157189","https://openalex.org/W2001369369","https://openalex.org/W2013514562","https://openalex.org/W2029084939","https://openalex.org/W2032612527","https://openalex.org/W2038705219","https://openalex.org/W2057550598","https://openalex.org/W2068514419","https://openalex.org/W2070577942","https://openalex.org/W2081183038","https://openalex.org/W2087295784","https://openalex.org/W2094411935","https://openalex.org/W2112048775","https://openalex.org/W2132549764","https://openalex.org/W2151537585","https://openalex.org/W2164364358","https://openalex.org/W2574134800","https://openalex.org/W6602586656","https://openalex.org/W6640632634"],"related_works":["https://openalex.org/W1981866886","https://openalex.org/W2052615004","https://openalex.org/W3080944905","https://openalex.org/W2073883415","https://openalex.org/W2944292463","https://openalex.org/W3014252901","https://openalex.org/W2652414671","https://openalex.org/W2188759683","https://openalex.org/W4317376680","https://openalex.org/W4360777922"],"abstract_inverted_index":{"Contemporary":[0],"machine":[1],"learning":[2],"systems":[3],"must":[4],"be":[5],"able":[6],"to":[7,92,116,140,176],"deal":[8,70],"with":[9,71,149],"ever-growing":[10],"volumes":[11],"of":[12,16,33,65,80,87,99,122,127,159,170,192,196],"data.":[13,202],"However,":[14],"most":[15],"the":[17,66,85,97,125,145,157,168,193],"canonical":[18],"classifiers":[19,95],"are":[20,164],"not":[21,114],"well-suited":[22],"for":[23,45,50,166,188,200],"big":[24,51,201],"data":[25,52],"analytics.":[26],"This":[27],"is":[28,40],"especially":[29],"vivid":[30],"in":[31,182],"case":[32],"distance-based":[34,94],"classifiers,":[35],"where":[36],"their":[37],"classification":[38,153],"time":[39],"prohibitive.":[41],"Recently,":[42],"many":[43],"methods":[44],"adapting":[46],"nearest":[47,141,197],"neighbour":[48,142,198],"classifier":[49,143],"were":[53],"proposed.":[54],"We":[55,90,155],"investigate":[56,156],"simple,":[57],"yet":[58],"efficient":[59],"technique":[60],"based":[61,180],"on":[62,96],"random":[63],"under-sampling":[64],"dataset.":[67,89,172],"As":[68],"we":[69,130,174],"stationary":[72],"data,":[73],"one":[74,112],"may":[75],"assume":[76],"that":[77,132,163],"a":[78,150,183,189],"subset":[79],"objects":[81],"will":[82],"sufficiently":[83],"capture":[84],"properties":[86,169],"given":[88],"propose":[91,175],"build":[93],"basis":[98,126],"very":[100],"small":[101],"subsamples":[102],"and":[103],"then":[104],"combine":[105],"them":[106],"into":[107],"an":[108,134],"ensemble.":[109],"With":[110],"this,":[111],"does":[113],"need":[115],"aggregate":[117],"datasets,":[118],"only":[119],"local":[120],"decisions":[121],"classifiers.":[123],"On":[124],"experimental":[128],"results":[129,139],"show":[131],"such":[133],"approach":[135],"can":[136],"return":[137],"comparable":[138],"over":[144],"entire":[146],"dataset,":[147],"but":[148],"significantly":[151],"reduced":[152],"time.":[154],"number":[158],"sub-samples":[160],"(ensemble":[161],"members),":[162],"required":[165],"capturing":[167],"each":[171],"Finally,":[173],"apply":[177],"our":[178],"sub-sampling":[179],"ensemble":[181],"distributed":[184],"environment,":[185],"which":[186],"allows":[187],"further":[190],"reduction":[191],"computational":[194],"complexity":[195],"rule":[199]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
