{"id":"https://openalex.org/W3013872119","doi":"https://doi.org/10.1007/s10766-020-00657-z","title":"Handling Data Skew for Aggregation in Spark SQL Using Task Stealing","display_name":"Handling Data Skew for Aggregation in Spark SQL Using Task Stealing","publication_year":2020,"publication_date":"2020-03-25","ids":{"openalex":"https://openalex.org/W3013872119","doi":"https://doi.org/10.1007/s10766-020-00657-z","mag":"3013872119"},"language":"en","primary_location":{"id":"doi:10.1007/s10766-020-00657-z","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s10766-020-00657-z","pdf_url":null,"source":{"id":"https://openalex.org/S148521650","display_name":"International Journal of Parallel Programming","issn_l":"0885-7458","issn":["0885-7458","1573-7640"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Parallel Programming","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064729057","display_name":"Zeyu He","orcid":"https://orcid.org/0000-0001-8017-2344"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zeyu He","raw_affiliation_strings":["School of Data Science and Engineering, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Data Science and Engineering, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037156146","display_name":"Qiuli Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiuli Huang","raw_affiliation_strings":["School of Data Science and Engineering, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Data Science and Engineering, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100656422","display_name":"Zhifang Li","orcid":"https://orcid.org/0000-0002-6090-0479"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhifang Li","raw_affiliation_strings":["School of Data Science and Engineering, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Data Science and Engineering, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025387109","display_name":"Chuliang Weng","orcid":"https://orcid.org/0000-0003-0293-5857"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuliang Weng","raw_affiliation_strings":["School of Data Science and Engineering, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Data Science and Engineering, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5064729057"],"corresponding_institution_ids":["https://openalex.org/I66867065"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":null,"fwci":0.6447,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.71121964,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"48","issue":"6","first_page":"941","last_page":"956"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8920161724090576},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.7647984623908997},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.7066089510917664},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6396808624267578},{"id":"https://openalex.org/keywords/skew","display_name":"Skew","score":0.5950015187263489},{"id":"https://openalex.org/keywords/theory-of-computation","display_name":"Theory of computation","score":0.5357429385185242},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.4188666045665741},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.41123461723327637},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.40366697311401367}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8920161724090576},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.7647984623908997},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.7066089510917664},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6396808624267578},{"id":"https://openalex.org/C43711488","wikidata":"https://www.wikidata.org/wiki/Q7534783","display_name":"Skew","level":2,"score":0.5950015187263489},{"id":"https://openalex.org/C24858836","wikidata":"https://www.wikidata.org/wiki/Q844718","display_name":"Theory of computation","level":2,"score":0.5357429385185242},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4188666045665741},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.41123461723327637},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.40366697311401367},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10766-020-00657-z","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s10766-020-00657-z","pdf_url":null,"source":{"id":"https://openalex.org/S148521650","display_name":"International Journal of Parallel Programming","issn_l":"0885-7458","issn":["0885-7458","1573-7640"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Parallel Programming","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1529847426","https://openalex.org/W1570320352","https://openalex.org/W2019380637","https://openalex.org/W2038412523","https://openalex.org/W2040842686","https://openalex.org/W2045725603","https://openalex.org/W2061601738","https://openalex.org/W2067089961","https://openalex.org/W2080131844","https://openalex.org/W2083630254","https://openalex.org/W2086977914","https://openalex.org/W2102967864","https://openalex.org/W2131975293","https://openalex.org/W2140509629","https://openalex.org/W2141267666","https://openalex.org/W2166418599","https://openalex.org/W2170544909","https://openalex.org/W2210299188","https://openalex.org/W2261536765","https://openalex.org/W2423220585","https://openalex.org/W2464834590","https://openalex.org/W2572141373","https://openalex.org/W2618868084","https://openalex.org/W2734430573","https://openalex.org/W2911536067"],"related_works":["https://openalex.org/W4290802965","https://openalex.org/W97789383","https://openalex.org/W3015859229","https://openalex.org/W3159871278","https://openalex.org/W2230552005","https://openalex.org/W2558523485","https://openalex.org/W4379407450","https://openalex.org/W2408437972","https://openalex.org/W2905107896","https://openalex.org/W2895375519"],"abstract_inverted_index":null,"counts_by_year":[{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
