{"id":"https://openalex.org/W2334418087","doi":"https://doi.org/10.1109/tpds.2016.2546909","title":"Leaky Buffer: A Novel Abstraction for Relieving Memory Pressure from Cluster Data Processing Frameworks","display_name":"Leaky Buffer: A Novel Abstraction for Relieving Memory Pressure from Cluster Data Processing Frameworks","publication_year":2016,"publication_date":"2016-03-25","ids":{"openalex":"https://openalex.org/W2334418087","doi":"https://doi.org/10.1109/tpds.2016.2546909","mag":"2334418087"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2016.2546909","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2546909","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054420886","display_name":"Zhaolei Liu","orcid":"https://orcid.org/0009-0009-4831-8185"},"institutions":[{"id":"https://openalex.org/I74775410","display_name":"Rice University","ror":"https://ror.org/008zs3103","country_code":"US","type":"education","lineage":["https://openalex.org/I74775410"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhaolei Liu","raw_affiliation_strings":["Computer Science Department, Rice University, Houston, TX"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Rice University, Houston, TX","institution_ids":["https://openalex.org/I74775410"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075120727","display_name":"T. S. Eugene Ng","orcid":"https://orcid.org/0000-0003-2954-0767"},"institutions":[{"id":"https://openalex.org/I74775410","display_name":"Rice University","ror":"https://ror.org/008zs3103","country_code":"US","type":"education","lineage":["https://openalex.org/I74775410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"T. S. Eugene Ng","raw_affiliation_strings":["Computer Science Department, Rice University, Houston, TX"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Rice University, Houston, TX","institution_ids":["https://openalex.org/I74775410"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5054420886"],"corresponding_institution_ids":["https://openalex.org/I74775410"],"apc_list":null,"apc_paid":null,"fwci":5.5429,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.95759171,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"28","issue":"1","first_page":"128","last_page":"140"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8879989385604858},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.6092744469642639},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.5632057785987854},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.5450729131698608},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.47643500566482544},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4465036690235138},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.44234782457351685},{"id":"https://openalex.org/keywords/overlay","display_name":"Overlay","score":0.18629536032676697},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.167809396982193},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.13612207770347595}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8879989385604858},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.6092744469642639},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.5632057785987854},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.5450729131698608},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.47643500566482544},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4465036690235138},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.44234782457351685},{"id":"https://openalex.org/C136085584","wikidata":"https://www.wikidata.org/wiki/Q910289","display_name":"Overlay","level":2,"score":0.18629536032676697},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.167809396982193},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.13612207770347595},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpds.2016.2546909","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2016.2546909","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},{"id":"pmh:oai:scholarship.rice.edu:1911/88106","is_oa":false,"landing_page_url":"http://hdl.handle.net/1911/88106","pdf_url":null,"source":{"id":"https://openalex.org/S4306401268","display_name":"Rice Digital Scholarship Archive (Rice University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I74775410","host_organization_name":"Rice University","host_organization_lineage":["https://openalex.org/I74775410"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Thesis"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.6100000143051147}],"awards":[{"id":"https://openalex.org/G1174379293","display_name":null,"funder_award_id":"CNS1305379","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5895531025","display_name":null,"funder_award_id":"CNS1162270","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8436838985","display_name":null,"funder_award_id":"CNS1422925","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320307762","display_name":"International Business Machines Corporation","ror":"https://ror.org/05hh8d621"},{"id":"https://openalex.org/F4320307764","display_name":"Microsoft","ror":"https://ror.org/00d0nc645"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1473115402","https://openalex.org/W1573783702","https://openalex.org/W1791587242","https://openalex.org/W1890643295","https://openalex.org/W2002472616","https://openalex.org/W2006140865","https://openalex.org/W2021932022","https://openalex.org/W2038157364","https://openalex.org/W2077967211","https://openalex.org/W2097484305","https://openalex.org/W2114303224","https://openalex.org/W2129726725","https://openalex.org/W2131975293","https://openalex.org/W2139072600","https://openalex.org/W2144518192","https://openalex.org/W2155072926","https://openalex.org/W2158535916","https://openalex.org/W2162709812","https://openalex.org/W2173213060","https://openalex.org/W2482213519","https://openalex.org/W2951128501","https://openalex.org/W3138367763","https://openalex.org/W6628737838","https://openalex.org/W6634337025","https://openalex.org/W6638231387","https://openalex.org/W6639249596","https://openalex.org/W6669897081"],"related_works":["https://openalex.org/W3015859229","https://openalex.org/W2230552005","https://openalex.org/W1975949872","https://openalex.org/W3159871278","https://openalex.org/W2905242764","https://openalex.org/W3109411864","https://openalex.org/W3017846737","https://openalex.org/W3003280185","https://openalex.org/W2942295204","https://openalex.org/W2792915651"],"abstract_inverted_index":{"The":[0,62],"shift":[1],"to":[2,36,55,142,187,196],"the":[3,14,24,33,44,76,85,93,100,112,118,122,144,171,178],"in-memory":[4,34,48],"data":[5,18,157],"processing":[6,19,158],"paradigm":[7,35],"has":[8],"had":[9],"a":[10,72,107,128,162],"major":[11],"influence":[12],"on":[13,99,161],"development":[15],"of":[16,46,64,75,117,164,180],"cluster":[17],"frameworks.":[20,159],"Numerous":[21],"frameworks":[22],"from":[23],"industry,":[25],"open":[26],"source":[27],"community":[28],"and":[29,39,60,80,135,190],"academia":[30],"are":[31,53,67],"adopting":[32],"achieve":[37],"functionalities":[38],"performance":[40,58,86,184],"breakthroughs.":[41],"However,":[42],"despite":[43],"advantages":[45],"these":[47],"frameworks,":[49],"in":[50,133,152],"practice":[51],"they":[52],"susceptible":[54],"memory-pressure":[56],"related":[57],"collapse":[59],"failures.":[61],"contributions":[63],"this":[65],"paper":[66],"twofold.":[68],"First,":[69],"we":[70,105,136],"conduct":[71],"detailed":[73],"diagnosis":[74],"memory":[77,165,192],"pressure":[78],"problem":[79,94],"identify":[81],"three":[82],"preconditions":[83,89],"for":[84],"collapse.":[87],"These":[88],"not":[90],"only":[91],"explain":[92],"but":[95],"also":[96,140],"shed":[97],"light":[98],"possible":[101],"solution":[102],"strategies.":[103],"Second,":[104],"propose":[106],"novel":[108],"programming":[109],"abstraction":[110,174],"called":[111],"leaky":[113,129,172],"bufferthat":[114],"eliminates":[115],"one":[116],"preconditions,":[119],"thereby":[120],"addressing":[121],"underlying":[123],"problem.":[124],"We":[125],"have":[126],"implemented":[127],"buffer":[130,173],"enabled":[131],"hashtable":[132,145],"Spark,":[134],"believe":[137],"it":[138],"is":[139],"able":[141],"substitute":[143],"that":[146,170],"performs":[147],"similar":[148],"hash":[149],"aggregation":[150,167],"operations":[151,168],"any":[153],"other":[154],"programs":[155],"or":[156],"Experiments":[160],"range":[163],"intensive":[166],"show":[169],"can":[175],"drastically":[176],"reduce":[177,191],"occurrence":[179],"memoryrelated":[181],"failures,":[182],"improve":[183],"by":[185,194],"up":[186,195],"507":[188],"percent":[189],"usage":[193],"87.5":[197],"percent.":[198]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
