{"id":"https://openalex.org/W4414986814","doi":"https://doi.org/10.1002/cpe.70337","title":"A Systematic Overview of Caching Mechanisms to Improve Hadoop Performance","display_name":"A Systematic Overview of Caching Mechanisms to Improve Hadoop Performance","publication_year":2025,"publication_date":"2025-10-07","ids":{"openalex":"https://openalex.org/W4414986814","doi":"https://doi.org/10.1002/cpe.70337"},"language":"en","primary_location":{"id":"doi:10.1002/cpe.70337","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.70337","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015729399","display_name":"Rana Ghazali","orcid":"https://orcid.org/0009-0001-7857-2231"},"institutions":[{"id":"https://openalex.org/I183067279","display_name":"Islamic Azad University North Tehran Branch","ror":"https://ror.org/00sb1nr29","country_code":"IR","type":"education","lineage":["https://openalex.org/I110525433","https://openalex.org/I183067279"]},{"id":"https://openalex.org/I98251732","display_name":"McMaster University","ror":"https://ror.org/02fa3aq29","country_code":"CA","type":"education","lineage":["https://openalex.org/I98251732"]}],"countries":["CA","IR"],"is_corresponding":true,"raw_author_name":"Rana Ghazali","raw_affiliation_strings":["Department of Computer Engineering North Tehran Branch, Islamic Azad University  Tehran Iran","Department of Computing and Software McMaster University  Hamilton Ontario Canada","Department of Computing and Software, McMaster University, Hamilton, Ontario, Canada","Department of Computer Engineering, North Tehran Branch, Islamic Azad University, Tehran, Iran"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering North Tehran Branch, Islamic Azad University  Tehran Iran","institution_ids":["https://openalex.org/I183067279"]},{"raw_affiliation_string":"Department of Computing and Software McMaster University  Hamilton Ontario Canada","institution_ids":["https://openalex.org/I98251732"]},{"raw_affiliation_string":"Department of Computing and Software, McMaster University, Hamilton, Ontario, Canada","institution_ids":["https://openalex.org/I98251732"]},{"raw_affiliation_string":"Department of Computer Engineering, North Tehran Branch, Islamic Azad University, Tehran, Iran","institution_ids":["https://openalex.org/I183067279"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000267488","display_name":"Douglas G. Down","orcid":"https://orcid.org/0000-0003-0881-831X"},"institutions":[{"id":"https://openalex.org/I98251732","display_name":"McMaster University","ror":"https://ror.org/02fa3aq29","country_code":"CA","type":"education","lineage":["https://openalex.org/I98251732"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Douglas G. Down","raw_affiliation_strings":["Department of Computing and Software McMaster University  Hamilton Ontario Canada","Department of Computing and Software, McMaster University, Hamilton, Ontario, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Computing and Software McMaster University  Hamilton Ontario Canada","institution_ids":["https://openalex.org/I98251732"]},{"raw_affiliation_string":"Department of Computing and Software, McMaster University, Hamilton, Ontario, Canada","institution_ids":["https://openalex.org/I98251732"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5015729399"],"corresponding_institution_ids":["https://openalex.org/I183067279","https://openalex.org/I98251732"],"apc_list":{"value":4740,"currency":"USD","value_usd":4740},"apc_paid":null,"fwci":1.6666,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.88896849,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"37","issue":"25-26","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.7498000264167786},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5236999988555908},{"id":"https://openalex.org/keywords/data-access","display_name":"Data access","score":0.41029998660087585},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.3871000111103058},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.3817000091075897},{"id":"https://openalex.org/keywords/distributed-database","display_name":"Distributed database","score":0.3682999908924103},{"id":"https://openalex.org/keywords/cache-algorithms","display_name":"Cache algorithms","score":0.35989999771118164}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9161999821662903},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.7498000264167786},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5236999988555908},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5001000165939331},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.41029998660087585},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.39730000495910645},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3871000111103058},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.3817000091075897},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.3682999908924103},{"id":"https://openalex.org/C38556500","wikidata":"https://www.wikidata.org/wiki/Q13404475","display_name":"Cache algorithms","level":4,"score":0.35989999771118164},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.33550000190734863},{"id":"https://openalex.org/C63540848","wikidata":"https://www.wikidata.org/wiki/Q3140932","display_name":"Fault tolerance","level":2,"score":0.323199987411499},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3091999888420105},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.29670000076293945},{"id":"https://openalex.org/C5165142","wikidata":"https://www.wikidata.org/wiki/Q5432732","display_name":"False sharing","level":5,"score":0.29339998960494995},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.2700999975204468},{"id":"https://openalex.org/C19012869","wikidata":"https://www.wikidata.org/wiki/Q578372","display_name":"Response time","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C1668388","wikidata":"https://www.wikidata.org/wiki/Q1149776","display_name":"Data management","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2572999894618988}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1002/cpe.70337","is_oa":false,"landing_page_url":"https://doi.org/10.1002/cpe.70337","pdf_url":null,"source":{"id":"https://openalex.org/S11065456","display_name":"Concurrency and Computation Practice and Experience","issn_l":"1532-0626","issn":["1532-0626","1532-0634"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Concurrency and Computation: Practice and Experience","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W786186891","https://openalex.org/W2010929544","https://openalex.org/W2013344760","https://openalex.org/W2272536022","https://openalex.org/W2318846467","https://openalex.org/W2496006161","https://openalex.org/W2522680599","https://openalex.org/W2585382847","https://openalex.org/W2618576559","https://openalex.org/W2992109006","https://openalex.org/W3145616277","https://openalex.org/W3168246045","https://openalex.org/W4244412182","https://openalex.org/W4248729482","https://openalex.org/W4256178460","https://openalex.org/W4286268163","https://openalex.org/W4288885705","https://openalex.org/W4296448983","https://openalex.org/W4402845312","https://openalex.org/W4405182331","https://openalex.org/W4409550548","https://openalex.org/W4411747314"],"related_works":[],"abstract_inverted_index":{"ABSTRACT":[0],"In":[1],"today's":[2],"distributed":[3,46],"computing":[4],"environments,":[5],"the":[6,122,155,176,187,221,235,246],"rapid":[7],"generation":[8],"of":[9,20,112,157,178,189,223],"large\u2010scale":[10],"data":[11,41,64,90,94,262,294],"from":[12,59,228],"diverse":[13],"sources":[14],"poses":[15],"significant":[16,312],"challenges":[17,185],"in":[18,51,275,306,314],"terms":[19],"storage,":[21],"management,":[22],"and":[23,54,69,99,109,150,186,206,293],"processing,":[24],"particularly":[25],"for":[26,38,116,193,265,317],"traditional":[27,247],"relational":[28],"databases.":[29],"Hadoop":[30,57,124,165,183,318],"has":[31],"emerged":[32],"as":[33,141,201,216],"a":[34,106,202,208,254,279,311],"widely":[35],"adopted":[36],"framework":[37],"handling":[39],"such":[40,140],"through":[42],"parallel":[43],"processing":[44],"across":[45],"clusters.":[47],"Despite":[48],"its":[49],"advantages":[50],"scalability,":[52],"flexibility,":[53],"fault":[55],"tolerance,":[56],"suffers":[58],"inefficiencies":[60],"related":[61],"to":[62,259],"high":[63],"access":[65,91,151,263],"latency,":[66],"redundant":[67],"computations,":[68,98],"I/O":[70],"overhead,":[71],"which":[72,244],"degrade":[73],"overall":[74],"system":[75],"performance.":[76],"To":[77,153],"mitigate":[78],"these":[79,158],"issues,":[80],"researchers":[81],"have":[82],"proposed":[83],"various":[84],"caching":[85,114,138,159,200,316],"mechanisms":[86],"aimed":[87],"at":[88],"improving":[89],"time,":[92,309],"enhancing":[93],"locality,":[95],"minimizing":[96],"duplicate":[97],"optimizing":[100],"resource":[101],"utilization.":[102],"This":[103],"paper":[104],"provides":[105],"comprehensive":[107],"survey":[108,197],"novel":[110,209],"classification":[111],"existing":[113],"strategies":[115],"Hadoop,":[117],"categorizing":[118],"them":[119],"based":[120,135],"on":[121,136,163],"specific":[123,182],"performance":[125,166,184,190],"bottlenecks":[126],"they":[127],"address.":[128],"A":[129],"detailed":[130],"comparative":[131],"analysis":[132],"is":[133,168,234,270],"provided":[134],"critical":[137],"characteristics":[139],"cached":[142],"item":[143],"type,":[144],"cache":[145,249,291],"management":[146],"policies,":[147],"replacement":[148,250],"strategies,":[149],"patterns.":[152],"assess":[154],"effectiveness":[156],"mechanisms,":[160],"their":[161],"impact":[162],"key":[164],"metrics":[167,191],"evaluated.":[169],"Also,":[170],"statistical":[171],"insights":[172],"are":[173],"presented,":[174],"highlighting":[175],"percentage":[177],"reviewed":[179],"studies":[180],"addressing":[181],"frequency":[188],"used":[192],"evaluation.":[194],"Finally,":[195],"this":[196],"identifies":[198],"hybrid":[199],"promising":[203],"future":[204,261],"trend":[205],"proposes":[207],"approach":[210],"termed":[211],"Hybrid":[212,236],"Intelligent":[213],"Cache":[214,271],"(HIC)":[215],"an":[217,302],"example.":[218],"HIC":[219,300],"combines":[220],"strengths":[222],"two":[224],"previously":[225],"developed":[226],"methods":[227],"distinct":[229],"categories.":[230],"The":[231,268],"first":[232],"method":[233],"Support":[237,255],"Vector":[238,256],"Machine\u2013Least":[239],"Recently":[240],"Used":[241],"(H\u2010SVM\u2010LRU)":[242],"algorithm,":[243],"enhances":[245],"LRU":[248],"strategy":[251],"by":[252,288],"employing":[253],"Machine":[257],"(SVM)":[258],"predict":[260],"patterns":[264],"intelligent":[266,315],"eviction.":[267],"second":[269],"Locality":[272],"with":[273],"Q\u2010Learning":[274],"MapReduce":[276],"Scheduling":[277],"(CLQLMRS),":[278],"reinforcement":[280],"learning\u2013based":[281],"scheduling":[282],"technique":[283],"that":[284,299],"optimizes":[285],"task":[286],"allocation":[287],"maximizing":[289],"both":[290],"locality":[292],"locality.":[295],"Experimental":[296],"results":[297],"demonstrate":[298],"yields":[301],"average":[303],"31.2%":[304],"improvement":[305],"job":[307],"execution":[308],"marking":[310],"advancement":[313],"ecosystems.":[319]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
