{"id":"https://openalex.org/W2773326840","doi":"https://doi.org/10.1109/tbdata.2017.2782785","title":"Handling Big Data Using a Data-Aware HDFS and Evolutionary Clustering Technique","display_name":"Handling Big Data Using a Data-Aware HDFS and Evolutionary Clustering Technique","publication_year":2017,"publication_date":"2017-12-13","ids":{"openalex":"https://openalex.org/W2773326840","doi":"https://doi.org/10.1109/tbdata.2017.2782785","mag":"2773326840"},"language":"en","primary_location":{"id":"doi:10.1109/tbdata.2017.2782785","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2017.2782785","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000673075","display_name":"Mustafa Hajeer","orcid":"https://orcid.org/0000-0002-4087-7646"},"institutions":[{"id":"https://openalex.org/I94658018","display_name":"University of Memphis","ror":"https://ror.org/01cq23130","country_code":"US","type":"education","lineage":["https://openalex.org/I94658018"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mustafa Hajeer","raw_affiliation_strings":["University of Memphis, Memphis, TN","University of Memphis, Memphis TN"],"raw_orcid":"https://orcid.org/0000-0002-4087-7646","affiliations":[{"raw_affiliation_string":"University of Memphis, Memphis, TN","institution_ids":["https://openalex.org/I94658018"]},{"raw_affiliation_string":"University of Memphis, Memphis TN","institution_ids":["https://openalex.org/I94658018"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048167872","display_name":"Dipankar Dasgupta","orcid":"https://orcid.org/0000-0002-3097-061X"},"institutions":[{"id":"https://openalex.org/I94658018","display_name":"University of Memphis","ror":"https://ror.org/01cq23130","country_code":"US","type":"education","lineage":["https://openalex.org/I94658018"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dipankar Dasgupta","raw_affiliation_strings":["Center for Information Assurance and Intelligent Security Systems Research Laboratory, The University of Memphis, Memphis, TN","The University of Memphis, Memphis TN"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Information Assurance and Intelligent Security Systems Research Laboratory, The University of Memphis, Memphis, TN","institution_ids":["https://openalex.org/I94658018"]},{"raw_affiliation_string":"The University of Memphis, Memphis TN","institution_ids":["https://openalex.org/I94658018"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I94658018"],"apc_list":null,"apc_paid":null,"fwci":2.4165,"has_fulltext":false,"cited_by_count":33,"citation_normalized_percentile":{"value":0.90752609,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"5","issue":"2","first_page":"134","last_page":"147"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8551561832427979},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.7468388676643372},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5617656707763672},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4838384687900543},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.46064311265945435},{"id":"https://openalex.org/keywords/distributed-file-system","display_name":"Distributed File System","score":0.45680326223373413},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4516160488128662},{"id":"https://openalex.org/keywords/file-system","display_name":"File system","score":0.44391703605651855},{"id":"https://openalex.org/keywords/distributed-database","display_name":"Distributed database","score":0.4388349950313568},{"id":"https://openalex.org/keywords/inefficiency","display_name":"Inefficiency","score":0.4171673655509949},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.37957465648651123},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.17068693041801453}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8551561832427979},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.7468388676643372},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5617656707763672},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4838384687900543},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.46064311265945435},{"id":"https://openalex.org/C152043487","wikidata":"https://www.wikidata.org/wiki/Q1229600","display_name":"Distributed File System","level":2,"score":0.45680326223373413},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4516160488128662},{"id":"https://openalex.org/C2780940931","wikidata":"https://www.wikidata.org/wiki/Q174989","display_name":"File system","level":2,"score":0.44391703605651855},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.4388349950313568},{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.4171673655509949},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.37957465648651123},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.17068693041801453},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tbdata.2017.2782785","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2017.2782785","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Big Data","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W95475432","https://openalex.org/W144268597","https://openalex.org/W156852397","https://openalex.org/W334811598","https://openalex.org/W1497990247","https://openalex.org/W1551709509","https://openalex.org/W1570991867","https://openalex.org/W1574601653","https://openalex.org/W1635892993","https://openalex.org/W1668065109","https://openalex.org/W1937427849","https://openalex.org/W1963834708","https://openalex.org/W1968999661","https://openalex.org/W1971421925","https://openalex.org/W1971922661","https://openalex.org/W1997482829","https://openalex.org/W2000825106","https://openalex.org/W2003500287","https://openalex.org/W2006606364","https://openalex.org/W2011883628","https://openalex.org/W2016829627","https://openalex.org/W2030696657","https://openalex.org/W2045387243","https://openalex.org/W2047940964","https://openalex.org/W2056259573","https://openalex.org/W2077744467","https://openalex.org/W2089458547","https://openalex.org/W2092865129","https://openalex.org/W2095293504","https://openalex.org/W2097893265","https://openalex.org/W2109726592","https://openalex.org/W2110086534","https://openalex.org/W2114507260","https://openalex.org/W2119625792","https://openalex.org/W2127048411","https://openalex.org/W2138655982","https://openalex.org/W2151936673","https://openalex.org/W2152430833","https://openalex.org/W2161077919","https://openalex.org/W2169490594","https://openalex.org/W2285144687","https://openalex.org/W2289597933","https://openalex.org/W2292704536","https://openalex.org/W2293919922","https://openalex.org/W2295965385","https://openalex.org/W2540570975","https://openalex.org/W2581225544","https://openalex.org/W2592230399","https://openalex.org/W3098742898","https://openalex.org/W3101413764","https://openalex.org/W3102641634","https://openalex.org/W6605883100","https://openalex.org/W6606267987","https://openalex.org/W6636862596","https://openalex.org/W6640568202","https://openalex.org/W6674762369","https://openalex.org/W6696105951","https://openalex.org/W6696671632","https://openalex.org/W6766086608"],"related_works":["https://openalex.org/W1480425691","https://openalex.org/W3042976586","https://openalex.org/W2488366707","https://openalex.org/W2571822082","https://openalex.org/W2225892199","https://openalex.org/W2168643770","https://openalex.org/W2069029637","https://openalex.org/W2593536136","https://openalex.org/W2098632277","https://openalex.org/W3046553064"],"abstract_inverted_index":{"The":[0],"increased":[1],"use":[2,32],"of":[3,14,27,59,70,141,150,162],"cyber-enabled":[4],"systems":[5,45],"and":[6,87,143,171,186],"Internet-of-Things":[7],"(IoT)":[8],"led":[9],"to":[10,77,98,137,157],"a":[11,113,123,159],"massive":[12],"amount":[13],"data":[15,21,64,85,131,142,152,163],"with":[16,48,190],"different":[17],"structures.":[18],"Most":[19],"big":[20],"solutions":[22],"are":[23,65,155],"built":[24],"on":[25,147,177],"top":[26],"the":[28,117,139,151],"Hadoop":[29,118,136],"eco-system":[30],"or":[31],"its":[33,144],"distributed":[34,124],"file":[35],"system":[36],"(HDFS).":[37],"However,":[38],"studies":[39],"have":[40],"shown":[41],"inefficiency":[42],"in":[43,84,89,95],"such":[44],"when":[46],"dealing":[47],"today's":[49,63],"data.":[50,71],"Some":[51],"research":[52],"overcame":[53],"these":[54],"problems":[55,100],"for":[56,116,127],"specific":[57],"types":[58,164],"graph":[60],"data,":[61],"but":[62],"more":[66,103],"than":[67],"one":[68],"type":[69],"Such":[72],"efficiency":[73],"issues":[74],"may":[75],"lead":[76,97],"large-scale":[78],"problems,":[79],"including":[80],"larger":[81],"space":[82],"requirements":[83],"centers,":[86],"waste":[88],"resources":[90],"(like":[91],"power":[92],"consumption),":[93],"that":[94],"turn":[96],"environmental":[99],"(such":[101],"as":[102,108,165,167],"carbon":[104],"emission)":[105],"[1]":[106],",":[107],"per":[109],"scholars.":[110],"We":[111,120,154,174],"propose":[112,122],"data-aware":[114],"module":[115],"eco-system.":[119],"also":[121],"encoding":[125],"technique":[126],"genetic":[128],"algorithms":[129],"efficient":[130],"processing.":[132],"Our":[133],"framework":[134],"allows":[135],"manage":[138],"distribution":[140],"placement":[145],"based":[146],"cluster":[148],"analysis":[149],"itself.":[153],"able":[156],"handle":[158],"broad":[160],"range":[161],"well":[166],"optimize":[168],"query":[169],"time":[170],"resource":[172],"usage.":[173],"performed":[175],"experiments":[176],"multiple":[178],"datasets":[179],"generated":[180],"via":[181],"LUBM":[182],"(Lehigh":[183],"University":[184],"Benchmark)":[185],"reported":[187],"results":[188],"along":[189],"performance":[191],"analysis.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":3}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
