{"id":"https://openalex.org/W2998950759","doi":"https://doi.org/10.1186/s40537-019-0279-z","title":"Decreasing the execution time of reducers by revising clustering based on the futuristic greedy approach","display_name":"Decreasing the execution time of reducers by revising clustering based on the futuristic greedy approach","publication_year":2020,"publication_date":"2020-01-09","ids":{"openalex":"https://openalex.org/W2998950759","doi":"https://doi.org/10.1186/s40537-019-0279-z","mag":"2998950759"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-019-0279-z","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-019-0279-z","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0279-z","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0279-z","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047122832","display_name":"Ali Bakhthemmat","orcid":null},"institutions":[{"id":"https://openalex.org/I133529467","display_name":"Sharif University of Technology","ror":"https://ror.org/024c2fq17","country_code":"IR","type":"education","lineage":["https://openalex.org/I133529467"]}],"countries":["IR"],"is_corresponding":true,"raw_author_name":"Ali Bakhthemmat","raw_affiliation_strings":["Kish International Campus, Sharif University of Technology, Tehran, Iran"],"affiliations":[{"raw_affiliation_string":"Kish International Campus, Sharif University of Technology, Tehran, Iran","institution_ids":["https://openalex.org/I133529467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033902274","display_name":"Mohammad Izadi","orcid":"https://orcid.org/0000-0003-3561-3942"},"institutions":[{"id":"https://openalex.org/I133529467","display_name":"Sharif University of Technology","ror":"https://ror.org/024c2fq17","country_code":"IR","type":"education","lineage":["https://openalex.org/I133529467"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Mohammad Izadi","raw_affiliation_strings":["Department of Computer Engineering, Sharif University of Technology, Tehran, Iran"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Sharif University of Technology, Tehran, Iran","institution_ids":["https://openalex.org/I133529467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5047122832"],"corresponding_institution_ids":["https://openalex.org/I133529467"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":1.5085,"has_fulltext":true,"cited_by_count":13,"citation_normalized_percentile":{"value":0.85922366,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"7","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8483395576477051},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7237612009048462},{"id":"https://openalex.org/keywords/reducer","display_name":"Reducer","score":0.6747758388519287},{"id":"https://openalex.org/keywords/execution-time","display_name":"Execution time","score":0.654194712638855},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.5630272030830383},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.50057053565979},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.48990315198898315},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.4736781418323517},{"id":"https://openalex.org/keywords/phase","display_name":"Phase (matter)","score":0.4609091877937317},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4561152160167694},{"id":"https://openalex.org/keywords/running-time","display_name":"Running time","score":0.44695979356765747},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.44116368889808655},{"id":"https://openalex.org/keywords/dbscan","display_name":"DBSCAN","score":0.41643577814102173},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3766654431819916},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3524947166442871},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.18556436896324158},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.15538185834884644},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.13374575972557068},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.09617117047309875}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8483395576477051},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7237612009048462},{"id":"https://openalex.org/C2776985865","wikidata":"https://www.wikidata.org/wiki/Q26820931","display_name":"Reducer","level":2,"score":0.6747758388519287},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.654194712638855},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.5630272030830383},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.50057053565979},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.48990315198898315},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.4736781418323517},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.4609091877937317},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4561152160167694},{"id":"https://openalex.org/C3017489831","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Running time","level":2,"score":0.44695979356765747},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.44116368889808655},{"id":"https://openalex.org/C46576248","wikidata":"https://www.wikidata.org/wiki/Q1114630","display_name":"DBSCAN","level":5,"score":0.41643577814102173},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3766654431819916},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3524947166442871},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.18556436896324158},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.15538185834884644},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.13374575972557068},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.09617117047309875},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C147176958","wikidata":"https://www.wikidata.org/wiki/Q77590","display_name":"Civil engineering","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-019-0279-z","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-019-0279-z","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0279-z","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:091aa5fa59634faf9d0457d23e311596","is_oa":true,"landing_page_url":"https://doaj.org/article/091aa5fa59634faf9d0457d23e311596","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 7, Iss 1, Pp 1-21 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-019-0279-z","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-019-0279-z","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0279-z","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.550000011920929,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2998950759.pdf","grobid_xml":"https://content.openalex.org/works/W2998950759.grobid-xml"},"referenced_works_count":41,"referenced_works":["https://openalex.org/W1680797894","https://openalex.org/W1735916776","https://openalex.org/W1885124406","https://openalex.org/W1918839972","https://openalex.org/W1968160647","https://openalex.org/W1971596129","https://openalex.org/W1993972700","https://openalex.org/W2008286666","https://openalex.org/W2029728897","https://openalex.org/W2033403400","https://openalex.org/W2055903840","https://openalex.org/W2109275473","https://openalex.org/W2116762767","https://openalex.org/W2122370965","https://openalex.org/W2149373142","https://openalex.org/W2311355646","https://openalex.org/W2505839951","https://openalex.org/W2519564115","https://openalex.org/W2561675875","https://openalex.org/W2581190813","https://openalex.org/W2617160631","https://openalex.org/W2617904355","https://openalex.org/W2620864032","https://openalex.org/W2735941455","https://openalex.org/W2751422831","https://openalex.org/W2786065378","https://openalex.org/W2786189002","https://openalex.org/W2789168111","https://openalex.org/W2807639926","https://openalex.org/W2883711134","https://openalex.org/W2885588543","https://openalex.org/W2910000146","https://openalex.org/W2918668824","https://openalex.org/W2925286065","https://openalex.org/W2969722626","https://openalex.org/W2970121096","https://openalex.org/W3105265400","https://openalex.org/W4230355096","https://openalex.org/W4238634277","https://openalex.org/W6637349233","https://openalex.org/W6657951020"],"related_works":["https://openalex.org/W2187492663","https://openalex.org/W3000354920","https://openalex.org/W4290987788","https://openalex.org/W2368219397","https://openalex.org/W3004596345","https://openalex.org/W2959625647","https://openalex.org/W2503866109","https://openalex.org/W2314379296","https://openalex.org/W3168814018","https://openalex.org/W2186523764"],"abstract_inverted_index":{"Abstract":[0],"MapReduce":[1],"is":[2,59],"used":[3],"within":[4],"the":[5,24,34,44,52,65,72,76,83,92,97,102,106,111,114,123,130,147,150,153,163,168,171,177,192,196,204],"Hadoop":[6,73],"framework,":[7],"which":[8],"handles":[9],"two":[10],"important":[11],"tasks:":[12],"mapping":[13],"and":[14,20,50,94,175],"reducing.":[15],"Data":[16],"clustering":[17,49,178],"in":[18,71,86,158,162,207],"mappers":[19],"reducers":[21,135,154,166,174,180],"can":[22,30],"decrease":[23],"execution":[25,46,197],"time,":[26],"as":[27],"similar":[28,117],"data":[29,68,81],"be":[31],"assigned":[32,100,128],"to":[33,88,101,129,181],"same":[35],"reducer":[36],"with":[37],"one":[38],"key.":[39],"Our":[40,56,187],"proposed":[41,57,193],"method":[42,85],"decreases":[43],"overall":[45],"time":[47,198],"by":[48,141,199],"lowering":[51],"number":[53,172],"of":[54,61,91,113,173],"reducers.":[55,131,148],"algorithm":[58,194,206],"composed":[60],"five":[62],"phases.":[63],"In":[64,75,122,149],"first":[66],"phase,":[67,78,116,125,152,165],"are":[69,99,119,127,136],"stored":[70],"structure.":[74],"second":[77,115],"we":[79],"cluster":[80],"using":[82,105],"MR-DBSCAN-KD":[84],"order":[87],"determine":[89],"all":[90],"outliers":[93,98],"clusters.":[95],"Then,":[96],"existing":[103],"clusters":[104,118,126],"futuristic":[107],"greedy":[108],"method.":[109],"At":[110],"end":[112],"merged":[120],"together.":[121],"third":[124],"Note":[132],"that":[133,191],"fewer":[134],"required":[137],"for":[138],"this":[139],"task":[140],"applying":[142],"approximated":[143],"load":[144],"balancing":[145],"between":[146],"fourth":[151],"execute":[155],"their":[156,183],"jobs":[157,184],"each":[159],"cluster.":[160],"Eventually,":[161],"final":[164],"return":[167],"output.":[169],"Decreasing":[170],"revising":[176],"helped":[179],"perform":[182],"almost":[185],"simultaneously.":[186],"research":[188],"results":[189],"indicate":[190],"improves":[195],"about":[200],"3.9%":[201],"less":[202],"than":[203],"fastest":[205],"our":[208],"experiments.":[209]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
