{"id":"https://openalex.org/W1996149237","doi":"https://doi.org/10.1109/infocom.2014.6847984","title":"SAP: Similarity-aware partitioning for efficient cloud storage","display_name":"SAP: Similarity-aware partitioning for efficient cloud storage","publication_year":2014,"publication_date":"2014-04-01","ids":{"openalex":"https://openalex.org/W1996149237","doi":"https://doi.org/10.1109/infocom.2014.6847984","mag":"1996149237"},"language":"en","primary_location":{"id":"doi:10.1109/infocom.2014.6847984","is_oa":false,"landing_page_url":"https://doi.org/10.1109/infocom.2014.6847984","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE INFOCOM 2014 - IEEE Conference on Computer Communications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/record/1273573","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033872928","display_name":"Bharath Balasubramanian","orcid":"https://orcid.org/0000-0003-2002-2349"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Bharath Balasubramanian","raw_affiliation_strings":["Princeton University, NJ, USA","Princeton University , Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Princeton University, NJ, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"Princeton University , Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018464968","display_name":"Tian Lan","orcid":"https://orcid.org/0000-0003-3010-8090"},"institutions":[{"id":"https://openalex.org/I193531525","display_name":"George Washington University","ror":"https://ror.org/00y4zzh67","country_code":"US","type":"education","lineage":["https://openalex.org/I193531525"]},{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tian Lan","raw_affiliation_strings":["Princeton University, NJ, USA","George Washington University Washington DC USA"],"affiliations":[{"raw_affiliation_string":"Princeton University, NJ, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"George Washington University Washington DC USA","institution_ids":["https://openalex.org/I193531525"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110782105","display_name":"Mung Chiang","orcid":"https://orcid.org/0000-0002-8920-651X"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mung Chiang","raw_affiliation_strings":["Princeton University, NJ, USA","Princeton University , Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Princeton University, NJ, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"Princeton University , Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5033872928"],"corresponding_institution_ids":["https://openalex.org/I20089843"],"apc_list":null,"apc_paid":null,"fwci":5.7599,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.95695441,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"592","last_page":"600"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10742","display_name":"Peer-to-Peer Network Technologies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7841211557388306},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.6550487875938416},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4697425961494446},{"id":"https://openalex.org/keywords/cloud-storage","display_name":"Cloud storage","score":0.4201315939426422},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.34130480885505676},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.22770556807518005},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.10576769709587097}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7841211557388306},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.6550487875938416},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4697425961494446},{"id":"https://openalex.org/C2777059624","wikidata":"https://www.wikidata.org/wiki/Q914359","display_name":"Cloud storage","level":3,"score":0.4201315939426422},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.34130480885505676},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.22770556807518005},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.10576769709587097},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/infocom.2014.6847984","is_oa":false,"landing_page_url":"https://doi.org/10.1109/infocom.2014.6847984","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE INFOCOM 2014 - IEEE Conference on Computer Communications","raw_type":"proceedings-article"},{"id":"pmh:oai:zenodo.org:1273573","is_oa":true,"landing_page_url":"https://zenodo.org/record/1273573","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferencePaper"}],"best_oa_location":{"id":"pmh:oai:zenodo.org:1273573","is_oa":true,"landing_page_url":"https://zenodo.org/record/1273573","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferencePaper"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W89823361","https://openalex.org/W104626050","https://openalex.org/W174289249","https://openalex.org/W193648907","https://openalex.org/W200233886","https://openalex.org/W1529205966","https://openalex.org/W1609518033","https://openalex.org/W1651093245","https://openalex.org/W1819656317","https://openalex.org/W1984572897","https://openalex.org/W1996149237","https://openalex.org/W2029673812","https://openalex.org/W2062832101","https://openalex.org/W2103128823","https://openalex.org/W2105848461","https://openalex.org/W2109943392","https://openalex.org/W2110322986","https://openalex.org/W2123767107","https://openalex.org/W2133117081","https://openalex.org/W2147755199","https://openalex.org/W2157240622","https://openalex.org/W2166667085","https://openalex.org/W2168595508","https://openalex.org/W2172220707","https://openalex.org/W2331180561","https://openalex.org/W3150003982","https://openalex.org/W6603735688","https://openalex.org/W6607057542","https://openalex.org/W6607794886","https://openalex.org/W6608138927","https://openalex.org/W6631739990","https://openalex.org/W6636190696","https://openalex.org/W6638528349","https://openalex.org/W6681926217","https://openalex.org/W6684674479","https://openalex.org/W6793350840"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W4244478748","https://openalex.org/W4223488648","https://openalex.org/W2134969820","https://openalex.org/W2251605416","https://openalex.org/W2560439919","https://openalex.org/W4389340727","https://openalex.org/W3150465815","https://openalex.org/W1997222214"],"abstract_inverted_index":{"Given":[0],"a":[1,7,14,24,30,59],"set":[2,25],"of":[3,10,17,26,62],"files":[4,45,83,118,137,188],"that":[5,32,149,168,194],"show":[6,148],"certain":[8],"degree":[9],"similarity,":[11],"we":[12,78,114,146,162],"consider":[13],"novel":[15],"problem":[16],"deduplicating":[18],"them":[19,87],"(eliminating":[20],"redundant":[21],"chunks)":[22],"across":[23,88,136],"distributed":[27],"servers":[28,90,100],"in":[29,68,76,112],"manner":[31],"is:":[33],"(i)":[34],"space-efficient:":[35],"the":[36,44,82,89,106,117,120,134,140,164,195,211],"total":[37],"space":[38,141,153,179],"needed":[39],"to":[40,92,101,138,210],"deduplicate":[41,80],"and":[42,84,122,176,191],"store":[43,124],"is":[46,156,198],"minimized":[47],"and,":[48],"(ii)":[49],"access-efficient:":[50],"each":[51,103,129],"file":[52],"can":[53],"be":[54],"accessed":[55],"by":[56],"communicating":[57],"with":[58,98],"bounded":[60,178],"number":[61],"servers,":[63,121],"thereby":[64],"minimizing":[65],"network-access":[66],"times":[67],"congested":[69],"data":[70],"center":[71],"networks.":[72],"A":[73],"space-optimal":[74],"solution":[75,111,155],"which":[77,113],"first":[79,147],"all":[81],"then":[85,123],"distribute":[86],"(referred":[91],"as":[93],"chunk-distribution),":[94],"may":[95,131],"require":[96],"communication":[97],"many":[99],"access":[102],"file.":[104],"On":[105],"other":[107],"hand,":[108],"an":[109,151,157],"access-efficient":[110,170],"randomly":[115],"partition":[116],"cross":[119],"their":[125],"unique":[126],"chunks":[127],"on":[128,187],"server":[130],"not":[132],"exploit":[133],"similarities":[135],"reduce":[139],"overhead.":[142],"In":[143],"this":[144],"paper,":[145],"finding":[150],"access-efficient,":[152],"optimal":[154],"NP-Hard":[158],"problem.":[159],"Following":[160],"this,":[161],"present":[163],"similarity-aware-partitioning":[165],"(SAP)":[166],"algorithms":[167],"find":[169],"solutions":[171],"within":[172],"polynomial":[173],"time":[174],"complexity":[175],"guarantees":[177],"overhead":[180],"for":[181],"arbitrary":[182],"files.":[183],"Our":[184],"experimental":[185],"verification":[186],"from":[189],"Dropbox":[190],"CNN":[192],"confirm":[193],"SAP":[196],"technique":[197],"much":[199],"more":[200],"space-efficient":[201],"than":[202],"random":[203],"partitioning,":[204],"while":[205],"maintaining":[206],"compression":[207],"ratio":[208],"close":[209],"chunk-distribution":[212],"solution.":[213]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
