{"id":"https://openalex.org/W2903455402","doi":"https://doi.org/10.1145/3274808.3274811","title":"Size Matters","display_name":"Size Matters","publication_year":2018,"publication_date":"2018-11-26","ids":{"openalex":"https://openalex.org/W2903455402","doi":"https://doi.org/10.1145/3274808.3274811","mag":"2903455402"},"language":"en","primary_location":{"id":"doi:10.1145/3274808.3274811","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3274808.3274811","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th International Middleware Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:kth:diva-238597","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001436192","display_name":"Salman Niazi","orcid":"https://orcid.org/0000-0002-1672-6899"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Salman Niazi","raw_affiliation_strings":["KTH - Royal Institute of Technology and Logical Clocks AB"],"affiliations":[{"raw_affiliation_string":"KTH - Royal Institute of Technology and Logical Clocks AB","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052059275","display_name":"Mikael Ronstr\u00f6m","orcid":"https://orcid.org/0009-0004-1524-606X"},"institutions":[{"id":"https://openalex.org/I1342911587","display_name":"Oracle (United States)","ror":"https://ror.org/006c77m33","country_code":"US","type":"company","lineage":["https://openalex.org/I1342911587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mikael Ronstr\u00f6m","raw_affiliation_strings":["Oracle AB"],"affiliations":[{"raw_affiliation_string":"Oracle AB","institution_ids":["https://openalex.org/I1342911587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090695078","display_name":"Seif Haridi","orcid":"https://orcid.org/0000-0002-6718-0144"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Seif Haridi","raw_affiliation_strings":["KTH - Royal Institute of Technology and Logical Clocks AB"],"affiliations":[{"raw_affiliation_string":"KTH - Royal Institute of Technology and Logical Clocks AB","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055127792","display_name":"Jim Dowling","orcid":"https://orcid.org/0000-0002-9484-6714"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Jim Dowling","raw_affiliation_strings":["KTH - Royal Institute of Technology and Logical Clocks AB"],"affiliations":[{"raw_affiliation_string":"KTH - Royal Institute of Technology and Logical Clocks AB","institution_ids":["https://openalex.org/I86987016"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5001436192"],"corresponding_institution_ids":["https://openalex.org/I86987016"],"apc_list":null,"apc_paid":null,"fwci":4.9341,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.95842414,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"26","last_page":"39"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8187048435211182},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.7982208728790283},{"id":"https://openalex.org/keywords/distributed-file-system","display_name":"Distributed File System","score":0.7315199375152588},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5750017166137695},{"id":"https://openalex.org/keywords/file-system","display_name":"File system","score":0.5603640079498291},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5369060039520264},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.5146487951278687},{"id":"https://openalex.org/keywords/file-size","display_name":"File size","score":0.4301108717918396},{"id":"https://openalex.org/keywords/reading","display_name":"Reading (process)","score":0.42160019278526306}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8187048435211182},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.7982208728790283},{"id":"https://openalex.org/C152043487","wikidata":"https://www.wikidata.org/wiki/Q1229600","display_name":"Distributed File System","level":2,"score":0.7315199375152588},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5750017166137695},{"id":"https://openalex.org/C2780940931","wikidata":"https://www.wikidata.org/wiki/Q174989","display_name":"File system","level":2,"score":0.5603640079498291},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5369060039520264},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5146487951278687},{"id":"https://openalex.org/C2776029614","wikidata":"https://www.wikidata.org/wiki/Q1146367","display_name":"File size","level":2,"score":0.4301108717918396},{"id":"https://openalex.org/C554936623","wikidata":"https://www.wikidata.org/wiki/Q199657","display_name":"Reading (process)","level":2,"score":0.42160019278526306},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3274808.3274811","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3274808.3274811","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th International Middleware Conference","raw_type":"proceedings-article"},{"id":"pmh:oai:DiVA.org:kth-238597","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:kth:diva-238597","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference paper"}],"best_oa_location":{"id":"pmh:oai:DiVA.org:kth-238597","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:kth:diva-238597","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference paper"},"sustainable_development_goals":[{"score":0.6299999952316284,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G5458775539","display_name":null,"funder_award_id":"732189","funder_id":"https://openalex.org/F4320332999","funder_display_name":"Horizon 2020 Framework Programme"},{"id":"https://openalex.org/G6508133030","display_name":null,"funder_award_id":"RIT15-0119","funder_id":"https://openalex.org/F4320320940","funder_display_name":"Stiftelsen f\u00f6r\u00a0Strategisk Forskning"},{"id":"https://openalex.org/G7331901853","display_name":null,"funder_award_id":"EU H2020","funder_id":"https://openalex.org/F4320332999","funder_display_name":"Horizon 2020 Framework Programme"}],"funders":[{"id":"https://openalex.org/F4320320940","display_name":"Stiftelsen f\u00f6r\u00a0Strategisk Forskning","ror":"https://ror.org/044wr7g58"},{"id":"https://openalex.org/F4320332999","display_name":"Horizon 2020 Framework Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W26797728","https://openalex.org/W1483926990","https://openalex.org/W1529677907","https://openalex.org/W1972058033","https://openalex.org/W1999984505","https://openalex.org/W2004958263","https://openalex.org/W2021060937","https://openalex.org/W2030877481","https://openalex.org/W2035735180","https://openalex.org/W2087946700","https://openalex.org/W2104292367","https://openalex.org/W2110528713","https://openalex.org/W2119565742","https://openalex.org/W2119738171","https://openalex.org/W2122465391","https://openalex.org/W2189465200","https://openalex.org/W2512358767","https://openalex.org/W2584004798","https://openalex.org/W2594680891","https://openalex.org/W2622263826","https://openalex.org/W2726953363","https://openalex.org/W2735439080","https://openalex.org/W2765309291","https://openalex.org/W2908504669","https://openalex.org/W2914583252","https://openalex.org/W2963078748","https://openalex.org/W3113167932","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2098632277","https://openalex.org/W2225892199","https://openalex.org/W2550058611","https://openalex.org/W2593536136","https://openalex.org/W2329901628","https://openalex.org/W3181039328","https://openalex.org/W2506014216","https://openalex.org/W64025680","https://openalex.org/W1876360099","https://openalex.org/W2207899285"],"abstract_inverted_index":{"The":[0,20],"Hadoop":[1,36,125],"Distributed":[2],"File":[3],"System":[4],"(HDFS)":[5],"is":[6,106],"designed":[7,75],"to":[8,91,132],"handle":[9],"massive":[10],"amounts":[11],"of":[12,23,34,42,46,61,98,151,160],"data,":[13],"preferably":[14],"stored":[15,85],"in":[16,25,54,86,102,116,137],"very":[17],"large":[18],"files.":[19,72],"poor":[21],"performance":[22,97],"HDFS":[24,118],"managing":[26],"small":[27,71,100,155],"files":[28,48,101,156],"has":[29],"long":[30],"been":[31],"a":[32,87,158],"bane":[33],"the":[35,47,63,96,99,117,121,124,149],"community.":[37],"In":[38,127],"many":[39],"production":[40],"deployments":[41],"HDFS,":[43],"almost":[44],"25%":[45],"are":[49,67],"less":[50],"than":[51],"16":[52],"KB":[53],"size":[55],"and":[56,82,94,109,140,153,162],"as":[57,59],"much":[58],"42%":[60],"all":[62],"file":[64],"system":[65],"operations":[66],"performed":[68],"on":[69],"these":[70],"We":[73],"have":[74],"an":[76],"adaptive":[77],"tiered":[78],"storage":[79],"using":[80,123],"in-memory":[81],"on-disk":[83],"tables":[84],"high-performance":[88],"distributed":[89],"database":[90],"efficiently":[92],"store":[93],"improve":[95],"HDFS.":[103],"Our":[104],"solution":[105,147],"completely":[107],"transparent,":[108],"it":[110],"does":[111],"not":[112],"require":[113],"any":[114],"changes":[115],"clients":[119],"or":[120],"applications":[122],"platform.":[126],"experiments,":[128],"we":[129],"observed":[130],"up":[131],"61":[133],"times":[134],"higher":[135],"throughput":[136],"writing":[138,154],"files,":[139],"for":[141],"real-world":[142],"workloads":[143],"from":[144],"Spotify":[145],"our":[146],"reduces":[148],"latency":[150],"reading":[152],"by":[157],"factor":[159],"3.15":[161],"7.39":[163],"respectively.":[164]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2018-12-11T00:00:00"}
