{"id":"https://openalex.org/W4283650604","doi":"https://doi.org/10.48550/arxiv.2206.12380","title":"VIP Hashing -- Adapting to Skew in Popularity of Data on the Fly (extended version)","display_name":"VIP Hashing -- Adapting to Skew in Popularity of Data on the Fly (extended version)","publication_year":2022,"publication_date":"2022-06-24","ids":{"openalex":"https://openalex.org/W4283650604","doi":"https://doi.org/10.48550/arxiv.2206.12380"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2206.12380","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.12380","pdf_url":"https://arxiv.org/pdf/2206.12380","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2206.12380","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029848318","display_name":"Aarati Kakaraparthy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kakaraparthy, Aarati","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069237428","display_name":"Jignesh M. Patel","orcid":"https://orcid.org/0000-0003-3653-2538"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Patel, Jignesh M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085163415","display_name":"Brian Kroth","orcid":"https://orcid.org/0000-0002-5108-6743"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kroth, Brian P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5010089204","display_name":"Kwanghyun Park","orcid":"https://orcid.org/0000-0003-0757-2725"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Kwanghyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7835932970046997},{"id":"https://openalex.org/keywords/skew","display_name":"Skew","score":0.764001190662384},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.6716796159744263},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.6552183628082275},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.5452873706817627},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5198888778686523},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.4561024308204651},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4422786831855774},{"id":"https://openalex.org/keywords/dynamic-perfect-hashing","display_name":"Dynamic perfect hashing","score":0.42598414421081543},{"id":"https://openalex.org/keywords/linear-hashing","display_name":"Linear hashing","score":0.41938528418540955},{"id":"https://openalex.org/keywords/double-hashing","display_name":"Double hashing","score":0.29482412338256836},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.1491032838821411},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.13073375821113586},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1269012689590454}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7835932970046997},{"id":"https://openalex.org/C43711488","wikidata":"https://www.wikidata.org/wiki/Q7534783","display_name":"Skew","level":2,"score":0.764001190662384},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.6716796159744263},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.6552183628082275},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.5452873706817627},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5198888778686523},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.4561024308204651},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4422786831855774},{"id":"https://openalex.org/C122907437","wikidata":"https://www.wikidata.org/wiki/Q5318999","display_name":"Dynamic perfect hashing","level":5,"score":0.42598414421081543},{"id":"https://openalex.org/C36375716","wikidata":"https://www.wikidata.org/wiki/Q6553456","display_name":"Linear hashing","level":5,"score":0.41938528418540955},{"id":"https://openalex.org/C138111711","wikidata":"https://www.wikidata.org/wiki/Q478351","display_name":"Double hashing","level":4,"score":0.29482412338256836},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.1491032838821411},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.13073375821113586},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1269012689590454},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2206.12380","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.12380","pdf_url":"https://arxiv.org/pdf/2206.12380","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2206.12380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2206.12380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2206.12380","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.12380","pdf_url":"https://arxiv.org/pdf/2206.12380","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2334522381","https://openalex.org/W2076162755","https://openalex.org/W2084899141","https://openalex.org/W2811247857","https://openalex.org/W102859714","https://openalex.org/W3108021595","https://openalex.org/W2040748620","https://openalex.org/W1994360333","https://openalex.org/W2390631617","https://openalex.org/W4385261619"],"abstract_inverted_index":{"All":[0],"data":[1,10,26,55],"is":[2,11,74,146,242],"not":[3],"equally":[4],"popular.":[5],"Often,":[6],"some":[7],"portion":[8],"of":[9,24,82,102,170,189,225,237],"more":[12],"frequently":[13],"accessed":[14],"than":[15],"the":[16,25,43,66,80,100,129,135,152,158,187,233,243],"rest,":[17],"which":[18,241],"causes":[19],"a":[20,75,117,168,175,198],"skew":[21,31,67,130,190],"in":[22,42,68,131,151,186,193],"popularity":[23,69,132,153,223],"items.":[27],"Adapting":[28],"to":[29,79,155,216],"this":[30,36,49,111],"can":[32,64,107],"improve":[33],"performance,":[34],"and":[35,60,86,133,143,180,218,221],"topic":[37],"has":[38],"been":[39],"studied":[40],"extensively":[41],"past":[44],"for":[45,70,127,197],"disk-based":[46],"settings.":[47],"In":[48,110],"work,":[50],"we":[51,113],"consider":[52],"an":[53],"in-memory":[54],"structure,":[56],"namely":[57],"hash":[58,120,136,199],"table,":[59],"show":[61],"how":[62],"one":[63,202],"leverage":[65],"higher":[71],"performance.":[72],"Hashing":[73],"low-latency":[76],"operation,":[77],"sensitive":[78],"effects":[81],"caching,":[83],"branch":[84],"prediction,":[85],"code":[87],"complexity":[88],"among":[89],"other":[90],"factors.":[91],"These":[92,139],"factors":[93],"make":[94],"learning":[95,128,159],"in-the-loop":[96],"especially":[97],"challenging":[98],"as":[99,161],"overhead":[101,145],"performing":[103],"any":[104],"additional":[105],"operations":[106],"be":[108],"significant.":[109],"paper,":[112],"propose":[114],"VIP":[115,165,230],"hashing,":[116],"fully":[118],"online":[119],"table":[121,137,200],"method,":[122],"that":[123,182,229],"uses":[124],"lightweight":[125],"mechanisms":[126,140],"adapting":[134],"layout.":[138],"are":[141],"non-blocking,":[142],"their":[144],"controlled":[147],"by":[148,173,248],"sensing":[149],"changes":[150],"distribution":[154,224],"dynamically":[156],"switch-on/off":[157],"mechanism":[160],"needed.":[162],"We":[163,227],"tested":[164],"hashing":[166,177,231],"against":[167],"variety":[169],"workloads":[171],"generated":[172],"Wiscer,":[174],"homegrown":[176],"measurement":[178],"tool,":[179],"find":[181,228],"it":[183],"improves":[184],"performance":[185],"presence":[188],"(22%":[191],"increase":[192,209],"fetch":[194],"operation":[195],"throughput":[196],"with":[201],"million":[203],"keys":[204],"under":[205,210,250],"low":[206],"skew,":[207],"77%":[208],"medium":[211,251],"skew)":[212],"while":[213],"being":[214],"robust":[215],"insert":[217],"delete":[219],"operations,":[220],"changing":[222],"keys.":[226],"reduces":[232],"end-to-end":[234],"execution":[235],"time":[236],"TPC-H":[238,246],"query":[239],"9,":[240],"most":[244],"expensive":[245],"query,":[247],"20%":[249],"skew.":[252]},"counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2022-06-29T00:00:00"}
