{"id":"https://openalex.org/W2367400316","doi":"https://doi.org/10.1145/2903220.2903255","title":"Efficient MapReduce Kernel k-Means for Big Data Clustering","display_name":"Efficient MapReduce Kernel k-Means for Big Data Clustering","publication_year":2016,"publication_date":"2016-05-11","ids":{"openalex":"https://openalex.org/W2367400316","doi":"https://doi.org/10.1145/2903220.2903255","mag":"2367400316"},"language":"en","primary_location":{"id":"doi:10.1145/2903220.2903255","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2903220.2903255","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th Hellenic Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084148416","display_name":"Nikolaos Tsapanos","orcid":"https://orcid.org/0000-0002-9470-7159"},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Nikolaos Tsapanos","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041054091","display_name":"Anastasios Tefas","orcid":"https://orcid.org/0000-0003-1288-3667"},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Anastasios Tefas","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034879808","display_name":"Nikos Nikolaidis","orcid":"https://orcid.org/0000-0003-1515-7986"},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Nikolaos Nikolaidis","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061130224","display_name":"Ioannis Pitas","orcid":"https://orcid.org/0009-0006-7555-8641"},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Ioannis Pitas","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5084148416"],"corresponding_institution_ids":["https://openalex.org/I21370196"],"apc_list":null,"apc_paid":null,"fwci":1.69126127,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.93134444,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7764495015144348},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6676180362701416},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.6583012342453003},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6546319723129272},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3887938857078552},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22916102409362793},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14517924189567566},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.054798245429992676}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7764495015144348},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6676180362701416},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.6583012342453003},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6546319723129272},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3887938857078552},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22916102409362793},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14517924189567566},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.054798245429992676}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2903220.2903255","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2903220.2903255","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th Hellenic Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320334626","display_name":"Medical Research Council","ror":"https://ror.org/03x94j517"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1526146785","https://openalex.org/W1607985379","https://openalex.org/W1978383016","https://openalex.org/W1979655058","https://openalex.org/W1992419399","https://openalex.org/W2019464758","https://openalex.org/W2025707345","https://openalex.org/W2026705124","https://openalex.org/W2028565608","https://openalex.org/W2034616054","https://openalex.org/W2035979693","https://openalex.org/W2036260704","https://openalex.org/W2039051707","https://openalex.org/W2047244756","https://openalex.org/W2051586153","https://openalex.org/W2057309387","https://openalex.org/W2093771778","https://openalex.org/W2135957668","https://openalex.org/W2140095548","https://openalex.org/W2155074104","https://openalex.org/W2165521059","https://openalex.org/W2173213060","https://openalex.org/W2652751060"],"related_works":["https://openalex.org/W4226091590","https://openalex.org/W1997217298","https://openalex.org/W2953411182","https://openalex.org/W4226459110","https://openalex.org/W2780362365","https://openalex.org/W4248689491","https://openalex.org/W3012677882","https://openalex.org/W2532266515","https://openalex.org/W3126395262","https://openalex.org/W2286998681"],"abstract_inverted_index":{"Data":[0],"clustering":[1,36,70,81,209,229,254],"is":[2,18,38,43,48,64,157,212],"an":[3,231],"unsupervised":[4],"learning":[5],"task":[6],"that":[7,168,185,211,238],"has":[8,104],"found":[9],"many":[10],"applications":[11],"in":[12,28,54,77,126,138,221],"various":[13],"scientific":[14],"fields.":[15],"The":[16,148,191,235],"goal":[17],"to":[19,51,79,122,140,161,183,188,223,226],"find":[20],"subgroups":[21],"of":[22,31,67,91,99,150,153,165,260],"closely":[23],"related":[24],"data":[25],"samples":[26,184],"(clusters)":[27],"a":[29,65,83,107,127,207],"set":[30],"unlabeled":[32],"data.":[33,102],"A":[34],"classic":[35,92],"algorithm":[37],"the":[39,56,68,74,89,95,100,115,124,135,142,154,163,166,169,176,181,199,239,246,261],"so-called":[40],"k-Means.":[41],"It":[42,103],"very":[44],"popular,":[45],"however,":[46],"it":[47],"also":[49,133],"unable":[50],"handle":[52],"cases":[53],"which":[55,72,218],"clusters":[57],"are":[58],"not":[59],"linearly":[60],"separable.":[61],"Kernel":[62,112,131,216,249],"k-Means":[63,93,132],"state":[66,259],"art":[69,262],"algorithm,":[71],"employs":[73,219],"kernel":[75,136,155,177,263],"trick,":[76],"order":[78,139,222],"perform":[80,228],"on":[82,214,230],"higher":[84],"dimensionality":[85],"space,":[86],"thus":[87],"overcoming":[88],"limitations":[90],"regarding":[94],"non":[96],"linear":[97],"separability":[98],"input":[101],"recently":[105],"received":[106],"distributed":[108,117,128,200,208],"implementation,":[109],"named":[110],"Trimmed":[111,130,215,248],"k-Means,":[113,217,250],"following":[114],"MapReduce":[116],"computing":[118,194],"model.":[119],"In":[120,202],"addition":[121],"performing":[123],"computations":[125],"manner,":[129],"trims":[134],"matrix,":[137],"reduce":[141],"memory":[143],"requirements":[144],"and":[145,174],"improve":[146],"performance.":[147],"trimming":[149],"each":[151],"row":[152],"matrix":[156,178],"achieved":[158],"by":[159],"attempting":[160],"estimate":[162],"cardinality":[164],"cluster":[167,193],"corresponding":[170],"sample":[171,182],"belongs":[172],"to,":[173],"removing":[175],"entries":[179],"connecting":[180],"probably":[186],"belong":[187],"another":[189],"cluster.":[190],"Spark":[192],"framework":[195],"was":[196],"used":[197],"for":[198],"implementation.":[201],"this":[203],"paper,":[204],"we":[205],"present":[206],"scheme":[210],"based":[213],"subsampling,":[220],"be":[224],"able":[225],"efficiently":[227],"extremely":[232],"large":[233],"dataset.":[234],"results":[236],"indicate":[237],"proposed":[240],"method":[241],"run":[242],"much":[243],"faster":[244],"than":[245],"original":[247],"while":[251],"still":[252],"providing":[253],"performance":[255],"competitive":[256],"with":[257],"other":[258],"approaches.":[264]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
