{"id":"https://openalex.org/W2583182270","doi":"https://doi.org/10.1109/bigdata.2016.7840708","title":"Parallel clustering method for non-disjoint partitioning of large-scale data based on spark framework","display_name":"Parallel clustering method for non-disjoint partitioning of large-scale data based on spark framework","publication_year":2016,"publication_date":"2016-12-01","ids":{"openalex":"https://openalex.org/W2583182270","doi":"https://doi.org/10.1109/bigdata.2016.7840708","mag":"2583182270"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2016.7840708","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840708","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084395721","display_name":"Zayani Abir","orcid":null},"institutions":[{"id":"https://openalex.org/I237446400","display_name":"Institut Superieur de Gestion","ror":"https://ror.org/035fsmk47","country_code":"FR","type":"education","lineage":["https://openalex.org/I237446400"]},{"id":"https://openalex.org/I4210165976","display_name":"Institut Sup\u00e9rieur de Gestion","ror":"https://ror.org/05g9kje37","country_code":"MA","type":"education","lineage":["https://openalex.org/I4210165976"]}],"countries":["FR","MA"],"is_corresponding":true,"raw_author_name":"Abir Zayani","raw_affiliation_strings":["Institut Sup\u00e9rieur de Gestion, University of Tunis"],"affiliations":[{"raw_affiliation_string":"Institut Sup\u00e9rieur de Gestion, University of Tunis","institution_ids":["https://openalex.org/I237446400","https://openalex.org/I4210165976"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006094657","display_name":"Chiheb-Eddine Ben N\u2019Cir","orcid":"https://orcid.org/0000-0003-4014-8264"},"institutions":[{"id":"https://openalex.org/I83259278","display_name":"Manouba University","ror":"https://ror.org/0503ejf32","country_code":"TN","type":"education","lineage":["https://openalex.org/I83259278"]}],"countries":["TN"],"is_corresponding":false,"raw_author_name":"Chiheb-Eddine Ben N'Cir","raw_affiliation_strings":["ESEN University of Manouba"],"affiliations":[{"raw_affiliation_string":"ESEN University of Manouba","institution_ids":["https://openalex.org/I83259278"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110248637","display_name":"Nadia Essoussi","orcid":null},"institutions":[{"id":"https://openalex.org/I237446400","display_name":"Institut Superieur de Gestion","ror":"https://ror.org/035fsmk47","country_code":"FR","type":"education","lineage":["https://openalex.org/I237446400"]},{"id":"https://openalex.org/I4210165976","display_name":"Institut Sup\u00e9rieur de Gestion","ror":"https://ror.org/05g9kje37","country_code":"MA","type":"education","lineage":["https://openalex.org/I4210165976"]}],"countries":["FR","MA"],"is_corresponding":false,"raw_author_name":"Nadia Essoussi","raw_affiliation_strings":["Institut Sup\u00e9rieur de Gestion, University of Tunis"],"affiliations":[{"raw_affiliation_string":"Institut Sup\u00e9rieur de Gestion, University of Tunis","institution_ids":["https://openalex.org/I237446400","https://openalex.org/I4210165976"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5084395721"],"corresponding_institution_ids":["https://openalex.org/I237446400","https://openalex.org/I4210165976"],"apc_list":null,"apc_paid":null,"fwci":0.89,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.85446015,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"5211","issue":null,"first_page":"1064","last_page":"1069"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/disjoint-sets","display_name":"Disjoint sets","score":0.8802647590637207},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8242588043212891},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.796872615814209},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.6302425265312195},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5280417203903198},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.41996827721595764},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4196930229663849},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.39006760716438293},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2508392930030823},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.17021778225898743},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09442678093910217}],"concepts":[{"id":"https://openalex.org/C45340560","wikidata":"https://www.wikidata.org/wiki/Q215382","display_name":"Disjoint sets","level":2,"score":0.8802647590637207},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8242588043212891},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.796872615814209},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.6302425265312195},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5280417203903198},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.41996827721595764},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4196930229663849},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.39006760716438293},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2508392930030823},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.17021778225898743},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09442678093910217},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2016.7840708","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840708","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W128776091","https://openalex.org/W205409467","https://openalex.org/W1544966837","https://openalex.org/W1547566968","https://openalex.org/W1592690888","https://openalex.org/W1651093245","https://openalex.org/W1965563268","https://openalex.org/W1976860187","https://openalex.org/W1979679758","https://openalex.org/W1991099280","https://openalex.org/W1992419399","https://openalex.org/W2008043556","https://openalex.org/W2013344760","https://openalex.org/W2026680798","https://openalex.org/W2034616054","https://openalex.org/W2044719661","https://openalex.org/W2063372053","https://openalex.org/W2064909362","https://openalex.org/W2071177730","https://openalex.org/W2084049775","https://openalex.org/W2107117509","https://openalex.org/W2108399535","https://openalex.org/W2116762767","https://openalex.org/W2131975293","https://openalex.org/W2132904553","https://openalex.org/W2142489247","https://openalex.org/W2152910534","https://openalex.org/W2173213060","https://openalex.org/W2185136252","https://openalex.org/W2237006239","https://openalex.org/W2556629099","https://openalex.org/W2612166593","https://openalex.org/W4236642514","https://openalex.org/W4239540072","https://openalex.org/W6605268149","https://openalex.org/W6632600247","https://openalex.org/W6637231022","https://openalex.org/W6679815717","https://openalex.org/W6818663456"],"related_works":["https://openalex.org/W4256429076","https://openalex.org/W1971174658","https://openalex.org/W2099195351","https://openalex.org/W1975949872","https://openalex.org/W3159871278","https://openalex.org/W2230552005","https://openalex.org/W2905242764","https://openalex.org/W3109411864","https://openalex.org/W3017846737","https://openalex.org/W2348092930"],"abstract_inverted_index":{"Clustering":[0],"large":[1],"scale":[2],"data":[3,24,48,67],"has":[4,17],"become":[5],"an":[6],"important":[7],"challenge":[8],"which":[9,80,114],"motivates":[10],"several":[11,54],"recent":[12],"works.":[13],"While":[14],"the":[15,20,31,38,74,104,109],"emphasis":[16],"been":[18],"on":[19,118],"organization":[21],"of":[22,33,60,92,106,132],"massive":[23],"into":[25],"disjoint":[26,39],"groups,":[27],"this":[28,42,70],"work":[29],"considers":[30],"identification":[32],"non-disjoint":[34,63,90],"groups":[35,55],"rather":[36],"than":[37],"ones.":[40],"In":[41],"setting,":[43],"it":[44],"is":[45,81,97],"possible":[46],"for":[47],"object":[49],"to":[50,53,65,83,89,102,135],"belong":[51],"simultaneously":[52],"since":[56],"many":[57],"real-world":[58,121],"applications":[59],"clustering":[61,86,133],"require":[62],"partitioning":[64,91],"fit":[66],"structures.":[68],"For":[69],"purpose,":[71],"we":[72,115],"propose":[73],"Parallel":[75],"Overlapping":[76],"k-means":[77],"method":[78,96],"(POKM)":[79],"able":[82],"perform":[84],"parallel":[85],"processes":[87],"leading":[88],"data.":[93],"The":[94],"proposed":[95],"implemented":[98],"within":[99],"Spark":[100],"framework":[101],"ensure":[103],"distribution":[105],"works":[107],"over":[108],"different":[110],"computation":[111],"nodes.":[112],"Experiments":[113],"have":[116],"performed":[117],"simulated":[119],"and":[120,129],"multi-labeled":[122],"datasets":[123],"shows":[124],"both":[125],"faster":[126],"execution":[127],"times":[128],"high":[130],"quality":[131],"compared":[134],"existing":[136],"methods.":[137]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
