{"id":"https://openalex.org/W2343623344","doi":"https://doi.org/10.1109/tpds.2016.2560176","title":"FiDoop-DP: Data Partitioning in Frequent Itemset Mining on Hadoop Clusters","display_name":"FiDoop-DP: Data Partitioning in Frequent Itemset Mining on Hadoop Clusters","publication_year":2016,"publication_date":"2016-04-29","ids":{"openalex":"https://openalex.org/W2343623344","doi":"https://doi.org/10.1109/tpds.2016.2560176","mag":"2343623344"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2016.2560176","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2560176","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085599561","display_name":"Yaling Xun","orcid":"https://orcid.org/0000-0002-9590-6619"},"institutions":[{"id":"https://openalex.org/I46305995","display_name":"Taiyuan University of Science and Technology","ror":"https://ror.org/01wcbdc92","country_code":"CN","type":"education","lineage":["https://openalex.org/I46305995"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yaling Xun","raw_affiliation_strings":["Taiyuan University of Science and Technology, Taiyuan, Shanxi, China"],"affiliations":[{"raw_affiliation_string":"Taiyuan University of Science and Technology, Taiyuan, Shanxi, China","institution_ids":["https://openalex.org/I46305995"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046188958","display_name":"Jifu Zhang","orcid":"https://orcid.org/0000-0002-0396-8901"},"institutions":[{"id":"https://openalex.org/I46305995","display_name":"Taiyuan University of Science and Technology","ror":"https://ror.org/01wcbdc92","country_code":"CN","type":"education","lineage":["https://openalex.org/I46305995"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jifu Zhang","raw_affiliation_strings":["Taiyuan University of Science and Technology, Taiyuan, Shanxi, China"],"affiliations":[{"raw_affiliation_string":"Taiyuan University of Science and Technology, Taiyuan, Shanxi, China","institution_ids":["https://openalex.org/I46305995"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042766429","display_name":"Xiao Qin","orcid":"https://orcid.org/0000-0002-8345-3587"},"institutions":[{"id":"https://openalex.org/I82497590","display_name":"Auburn University","ror":"https://ror.org/02v80fc35","country_code":"US","type":"education","lineage":["https://openalex.org/I82497590"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiao Qin","raw_affiliation_strings":["Department of Computer Science and Software Engineering, Samuel Ginn College of Engineering, Auburn University, AL"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Software Engineering, Samuel Ginn College of Engineering, Auburn University, AL","institution_ids":["https://openalex.org/I82497590"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022687130","display_name":"Xujun Zhao","orcid":"https://orcid.org/0000-0003-2723-2613"},"institutions":[{"id":"https://openalex.org/I46305995","display_name":"Taiyuan University of Science and Technology","ror":"https://ror.org/01wcbdc92","country_code":"CN","type":"education","lineage":["https://openalex.org/I46305995"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xujun Zhao","raw_affiliation_strings":["Taiyuan University of Science and Technology, Taiyuan, Shanxi, China"],"affiliations":[{"raw_affiliation_string":"Taiyuan University of Science and Technology, Taiyuan, Shanxi, China","institution_ids":["https://openalex.org/I46305995"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5085599561"],"corresponding_institution_ids":["https://openalex.org/I46305995"],"apc_list":null,"apc_paid":null,"fwci":17.313,"has_fulltext":false,"cited_by_count":66,"citation_normalized_percentile":{"value":0.99021194,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"28","issue":"1","first_page":"101","last_page":"114"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8647000193595886},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.6075344681739807},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5307735800743103},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5010449886322021},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.4964311718940735},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.4932062029838562},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4851034879684448},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4649689495563507},{"id":"https://openalex.org/keywords/consistent-hashing","display_name":"Consistent hashing","score":0.44969093799591064},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4474574625492096},{"id":"https://openalex.org/keywords/ibm","display_name":"IBM","score":0.43234118819236755},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.41877281665802},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.41231846809387207},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.3870580196380615},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.2117041051387787}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8647000193595886},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.6075344681739807},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5307735800743103},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5010449886322021},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.4964311718940735},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.4932062029838562},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4851034879684448},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4649689495563507},{"id":"https://openalex.org/C56856351","wikidata":"https://www.wikidata.org/wiki/Q1757218","display_name":"Consistent hashing","level":5,"score":0.44969093799591064},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4474574625492096},{"id":"https://openalex.org/C70388272","wikidata":"https://www.wikidata.org/wiki/Q5968558","display_name":"IBM","level":2,"score":0.43234118819236755},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.41877281665802},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.41231846809387207},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.3870580196380615},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.2117041051387787},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138111711","wikidata":"https://www.wikidata.org/wiki/Q478351","display_name":"Double hashing","level":4,"score":0.0},{"id":"https://openalex.org/C171250308","wikidata":"https://www.wikidata.org/wiki/Q11468","display_name":"Nanotechnology","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2016.2560176","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2560176","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2303423109","display_name":null,"funder_award_id":"CCF-0845257","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3347073512","display_name":null,"funder_award_id":"61572343","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8650369768","display_name":null,"funder_award_id":"61272263","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W596485744","https://openalex.org/W603723648","https://openalex.org/W1481392940","https://openalex.org/W1544119352","https://openalex.org/W1547205936","https://openalex.org/W1736726159","https://openalex.org/W1964050638","https://openalex.org/W1981420413","https://openalex.org/W1991789623","https://openalex.org/W1992540139","https://openalex.org/W1994408342","https://openalex.org/W1995797177","https://openalex.org/W1997375126","https://openalex.org/W2004748427","https://openalex.org/W2011430131","https://openalex.org/W2018378172","https://openalex.org/W2027168615","https://openalex.org/W2049003051","https://openalex.org/W2056910091","https://openalex.org/W2071572981","https://openalex.org/W2073459066","https://openalex.org/W2081193615","https://openalex.org/W2090452820","https://openalex.org/W2097225630","https://openalex.org/W2102294813","https://openalex.org/W2105768086","https://openalex.org/W2112163170","https://openalex.org/W2112427676","https://openalex.org/W2133741724","https://openalex.org/W2142025585","https://openalex.org/W2150013559","https://openalex.org/W2158056686","https://openalex.org/W2161160262","https://openalex.org/W2164604674","https://openalex.org/W2173213060","https://openalex.org/W2189465200","https://openalex.org/W2277129084","https://openalex.org/W2542364126","https://openalex.org/W2543608830","https://openalex.org/W2916569980","https://openalex.org/W2953019775","https://openalex.org/W3104181340","https://openalex.org/W4254750692","https://openalex.org/W4300601563","https://openalex.org/W6632659161","https://openalex.org/W6668990524","https://openalex.org/W6674988879","https://openalex.org/W6687322159","https://openalex.org/W6729140741"],"related_works":["https://openalex.org/W2126795708","https://openalex.org/W2185281229","https://openalex.org/W3006522618","https://openalex.org/W1931672330","https://openalex.org/W2734989238","https://openalex.org/W4385261619","https://openalex.org/W4251536634","https://openalex.org/W2059096784","https://openalex.org/W1750955152","https://openalex.org/W1551533237"],"abstract_inverted_index":{"Traditional":[0],"parallel":[1,34,92,199],"algorithms":[2],"for":[3],"mining":[4,54],"frequent":[5],"itemsets":[6],"aim":[7],"to":[8,87,134,175,204],"balance":[9],"load":[10],"by":[11,25,57,68,154,161,181,202],"equally":[12],"partitioning":[13,44,72,109],"data":[14,43,71,108,132],"among":[15,61,114],"a":[16,27,40,70,131,149,155],"group":[17],"of":[18,31,84,91,102,142,158,184,196,210],"computing":[19,62,179],"nodes.":[20,63,190],"We":[21,64,145],"start":[22],"this":[23,66],"study":[24],"discovering":[26],"serious":[28],"performance":[29,90,195],"problem":[30,67],"the":[32,47,77,89,100,105,117,121,182,194,197],"existing":[33,48,198],"Frequent":[35,93],"Itemset":[36,94],"Mining":[37,95],"algorithms.":[38],"Given":[39],"large":[41],"dataset,":[42],"strategies":[45],"in":[46],"solutions":[49],"suffer":[50],"high":[51],"communication":[52],"and":[53,120,178],"overhead":[55],"induced":[56],"redundant":[58,143,186],"transactions":[59,129,187],"transmitted":[60],"address":[65],"developing":[69],"approach":[73],"called":[74],"FiDoop-DP":[75,85,103,125,147,172,191],"using":[76],"MapReduce":[78],"programming":[79],"model.":[80],"The":[81],"overarching":[82],"goal":[83],"is":[86,104,173],"boost":[88],"on":[96,148,188],"Hadoop":[97,151,189],"clusters.":[98],"At":[99],"heart":[101],"Voronoi":[106],"diagram-based":[107],"technique,":[110,124],"which":[111],"exploits":[112],"correlations":[113],"transactions.":[115,144],"Incorporating":[116],"similarity":[118],"metric":[119],"Locality-Sensitive":[122],"Hashing":[123],"places":[126],"highly":[127],"similar":[128],"into":[130],"partition":[133],"improve":[135],"locality":[136],"without":[137],"creating":[138],"an":[139,208],"excessive":[140],"number":[141],"implement":[146],"24-node":[150],"cluster,":[152],"driven":[153],"wide":[156],"range":[157],"datasets":[159],"created":[160],"IBM":[162],"Quest":[163],"Market-Basket":[164],"Synthetic":[165],"Data":[166],"Generator.":[167],"Experimental":[168],"results":[169],"reveal":[170],"that":[171],"conducive":[174],"reducing":[176],"network":[177],"loads":[180],"virtue":[183],"eliminating":[185],"significantly":[192],"improves":[193],"frequent-pattern":[200],"scheme":[201],"up":[203],"31":[205],"percent":[206],"with":[207],"average":[209],"18":[211],"percent.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":11},{"year":2017,"cited_by_count":4}],"updated_date":"2026-03-15T09:29:46.208133","created_date":"2025-10-10T00:00:00"}
