{"id":"https://openalex.org/W3174688741","doi":"https://doi.org/10.1145/3448016.3452798","title":"Adaptive Compression for Fast Scans on String Columns","display_name":"Adaptive Compression for Fast Scans on String Columns","publication_year":2021,"publication_date":"2021-06-09","ids":{"openalex":"https://openalex.org/W3174688741","doi":"https://doi.org/10.1145/3448016.3452798","mag":"3174688741"},"language":"en","primary_location":{"id":"doi:10.1145/3448016.3452798","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448016.3452798","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Management of Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036614082","display_name":"Yannis Foufoulas","orcid":"https://orcid.org/0000-0002-2785-946X"},"institutions":[{"id":"https://openalex.org/I200777214","display_name":"National and Kapodistrian University of Athens","ror":"https://ror.org/04gnjpq42","country_code":"GR","type":"education","lineage":["https://openalex.org/I200777214"]},{"id":"https://openalex.org/I4210156054","display_name":"Athena Research and Innovation Center In Information Communication & Knowledge Technologies","ror":"https://ror.org/0576by029","country_code":"GR","type":"facility","lineage":["https://openalex.org/I4210156054"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Yannis Foufoulas","raw_affiliation_strings":["University of Athens &amp; Athena Research Center, Athens, Greece"],"affiliations":[{"raw_affiliation_string":"University of Athens &amp; Athena Research Center, Athens, Greece","institution_ids":["https://openalex.org/I4210156054","https://openalex.org/I200777214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062962519","display_name":"Lefteris Sidirourgos","orcid":null},"institutions":[{"id":"https://openalex.org/I200777214","display_name":"National and Kapodistrian University of Athens","ror":"https://ror.org/04gnjpq42","country_code":"GR","type":"education","lineage":["https://openalex.org/I200777214"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Lefteris Sidirourgos","raw_affiliation_strings":["University of Athens, Athens, Greece"],"affiliations":[{"raw_affiliation_string":"University of Athens, Athens, Greece","institution_ids":["https://openalex.org/I200777214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064712737","display_name":"Eleftherios Stamatogiannakis","orcid":null},"institutions":[{"id":"https://openalex.org/I200777214","display_name":"National and Kapodistrian University of Athens","ror":"https://ror.org/04gnjpq42","country_code":"GR","type":"education","lineage":["https://openalex.org/I200777214"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Eleftherios Stamatogiannakis","raw_affiliation_strings":["University of Athens, Athens, Greece"],"affiliations":[{"raw_affiliation_string":"University of Athens, Athens, Greece","institution_ids":["https://openalex.org/I200777214"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084870386","display_name":"Yannis Ioannidis","orcid":"https://orcid.org/0000-0002-1705-8247"},"institutions":[{"id":"https://openalex.org/I4210156054","display_name":"Athena Research and Innovation Center In Information Communication & Knowledge Technologies","ror":"https://ror.org/0576by029","country_code":"GR","type":"facility","lineage":["https://openalex.org/I4210156054"]},{"id":"https://openalex.org/I200777214","display_name":"National and Kapodistrian University of Athens","ror":"https://ror.org/04gnjpq42","country_code":"GR","type":"education","lineage":["https://openalex.org/I200777214"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Yannis Ioannidis","raw_affiliation_strings":["Athena Research Center &amp; University of Athens, Athens, Greece"],"affiliations":[{"raw_affiliation_string":"Athena Research Center &amp; University of Athens, Athens, Greece","institution_ids":["https://openalex.org/I4210156054","https://openalex.org/I200777214"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5036614082"],"corresponding_institution_ids":["https://openalex.org/I200777214","https://openalex.org/I4210156054"],"apc_list":null,"apc_paid":null,"fwci":0.6113,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.69311498,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"554","last_page":"562"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8376767635345459},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.7049766182899475},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.6372550129890442},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.6364001035690308},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5348490476608276},{"id":"https://openalex.org/keywords/compression-ratio","display_name":"Compression ratio","score":0.5140827298164368},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5006227493286133},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4845063388347626},{"id":"https://openalex.org/keywords/associative-array","display_name":"Associative array","score":0.47730839252471924},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4309687614440918},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.382637619972229},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22448381781578064}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8376767635345459},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.7049766182899475},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.6372550129890442},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.6364001035690308},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5348490476608276},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.5140827298164368},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5006227493286133},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4845063388347626},{"id":"https://openalex.org/C168781493","wikidata":"https://www.wikidata.org/wiki/Q80585","display_name":"Associative array","level":2,"score":0.47730839252471924},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4309687614440918},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.382637619972229},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22448381781578064},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C511840579","wikidata":"https://www.wikidata.org/wiki/Q12757","display_name":"Internal combustion engine","level":2,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C171146098","wikidata":"https://www.wikidata.org/wiki/Q124192","display_name":"Automotive engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3448016.3452798","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448016.3452798","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Management of Data","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7699999809265137,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1494049834","https://openalex.org/W1584770030","https://openalex.org/W1967601791","https://openalex.org/W2054046497","https://openalex.org/W2080092502","https://openalex.org/W2085601491","https://openalex.org/W2102639991","https://openalex.org/W2106625078","https://openalex.org/W2123686039","https://openalex.org/W2135010923","https://openalex.org/W2140453381","https://openalex.org/W2151131744","https://openalex.org/W2156930555","https://openalex.org/W2172220707","https://openalex.org/W2340222647","https://openalex.org/W2439390339","https://openalex.org/W2950969408","https://openalex.org/W2955799495"],"related_works":["https://openalex.org/W4383723869","https://openalex.org/W2161302774","https://openalex.org/W2388481516","https://openalex.org/W4384298135","https://openalex.org/W4383722264","https://openalex.org/W1723410974","https://openalex.org/W3007688875","https://openalex.org/W2766695209","https://openalex.org/W3123970444","https://openalex.org/W2110517301"],"abstract_inverted_index":{"State-of-the-art":[0],"OLAP":[1],"systems":[2],"tend":[3],"to":[4,18,27,105,156],"use":[5],"columnar":[6],"data":[7,58],"representations,":[8],"as":[9],"these":[10],"are":[11],"both":[12,92],"suitable":[13],"for":[14,32,123],"analytics":[15],"and":[16,49,63,90,95,113],"amenable":[17],"compression.":[19],"Local":[20],"dictionary":[21,53,65,124,144],"value":[22],"encoding":[23],"has":[24,131],"been":[25],"shown":[26],"achieve":[28],"high":[29],"compression":[30,54,82,145],"rates":[31],"string":[33],"columns":[34],"while":[35],"still":[36],"allowing":[37],"fast":[38],"filtered":[39,71],"scans.":[40],"In":[41],"this":[42,76],"paper,":[43],"we":[44,78],"argue":[45],"that":[46,84],"the":[47,103,120,141],"effectiveness":[48],"efficiency":[50,94],"of":[51,129,159],"local":[52],"is":[55,85,147],"limited":[56],"by":[57,64,118],"repetition":[59],"across":[60,109],"file":[61,111],"blocks":[62,112],"look-ups":[66],"inside":[67],"each":[68],"block":[69],"during":[70],"scan":[72],"execution.":[73],"To":[74],"address":[75],"problem,":[77],"introduce":[79],"an":[80,157],"adaptive":[81],"technique":[83],"based":[86],"on":[87],"differential":[88],"dictionaries":[89],"targets":[91],"storage":[93],"query":[96],"performance.":[97],"The":[98],"proposed":[99,142],"scheme":[100,146],"reduces":[101],"dramatically":[102],"need":[104],"store":[106],"repeated":[107],"values":[108],"different":[110],"significantly":[114],"accelerates":[115],"read":[116],"operations":[117],"reducing":[119],"time":[121],"needed":[122],"look-ups.":[125],"A":[126],"preliminary":[127],"set":[128],"experiments":[130],"given":[132],"very":[133],"promising":[134],"results,":[135],"showing":[136],"that,":[137],"in":[138],"many":[139],"cases,":[140],"new":[143],"much":[148],"more":[149],"efficient":[150],"than":[151],"existing":[152],"techniques,":[153],"occasionally":[154],"up":[155],"order":[158],"magnitude.":[160]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
