{"id":"https://openalex.org/W2784168307","doi":"https://doi.org/10.1145/3159652.3159663","title":"Index Compression Using Byte-Aligned ANS Coding and Two-Dimensional Contexts","display_name":"Index Compression Using Byte-Aligned ANS Coding and Two-Dimensional Contexts","publication_year":2018,"publication_date":"2018-02-02","ids":{"openalex":"https://openalex.org/W2784168307","doi":"https://doi.org/10.1145/3159652.3159663","mag":"2784168307"},"language":"en","primary_location":{"id":"doi:10.1145/3159652.3159663","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3159652.3159663","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Eleventh ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081861848","display_name":"Alistair Moffat","orcid":"https://orcid.org/0000-0002-6638-0232"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Alistair Moffat","raw_affiliation_strings":["University of Melbourne, Melbourne, Australia"],"affiliations":[{"raw_affiliation_string":"University of Melbourne, Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086980890","display_name":"Matthias Petri","orcid":"https://orcid.org/0000-0002-0054-9429"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Matthias Petri","raw_affiliation_strings":["University of Melbourne, Melbourne, Australia"],"affiliations":[{"raw_affiliation_string":"University of Melbourne, Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5081861848"],"corresponding_institution_ids":["https://openalex.org/I165779595"],"apc_list":null,"apc_paid":null,"fwci":2.6061,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.91773777,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"405","last_page":"413"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11321","display_name":"Error Correcting Code Techniques","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7174946069717407},{"id":"https://openalex.org/keywords/arithmetic-coding","display_name":"Arithmetic coding","score":0.5356160402297974},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5306034684181213},{"id":"https://openalex.org/keywords/byte","display_name":"Byte","score":0.5175149440765381},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.5063499212265015},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.4950329661369324},{"id":"https://openalex.org/keywords/lossless-compression","display_name":"Lossless compression","score":0.47151079773902893},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.44105082750320435},{"id":"https://openalex.org/keywords/block-size","display_name":"Block size","score":0.41355371475219727},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4008428156375885},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.32939213514328003},{"id":"https://openalex.org/keywords/context-adaptive-binary-arithmetic-coding","display_name":"Context-adaptive binary arithmetic coding","score":0.25226569175720215},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.2390449345111847},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21756309270858765},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.09205672144889832}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7174946069717407},{"id":"https://openalex.org/C153338461","wikidata":"https://www.wikidata.org/wiki/Q2651","display_name":"Arithmetic coding","level":4,"score":0.5356160402297974},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5306034684181213},{"id":"https://openalex.org/C43364308","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Byte","level":2,"score":0.5175149440765381},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.5063499212265015},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.4950329661369324},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.47151079773902893},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.44105082750320435},{"id":"https://openalex.org/C41431624","wikidata":"https://www.wikidata.org/wiki/Q1053357","display_name":"Block size","level":3,"score":0.41355371475219727},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4008428156375885},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.32939213514328003},{"id":"https://openalex.org/C175732694","wikidata":"https://www.wikidata.org/wiki/Q1128713","display_name":"Context-adaptive binary arithmetic coding","level":3,"score":0.25226569175720215},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.2390449345111847},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21756309270858765},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.09205672144889832},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3159652.3159663","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3159652.3159663","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Eleventh ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W191231183","https://openalex.org/W1494592156","https://openalex.org/W1516527356","https://openalex.org/W1537803653","https://openalex.org/W1559631118","https://openalex.org/W1568325880","https://openalex.org/W1574036524","https://openalex.org/W1577505202","https://openalex.org/W1593203859","https://openalex.org/W1791987072","https://openalex.org/W1933799648","https://openalex.org/W1965473122","https://openalex.org/W1970885105","https://openalex.org/W1976656104","https://openalex.org/W1996930216","https://openalex.org/W2015255214","https://openalex.org/W2022292926","https://openalex.org/W2076471773","https://openalex.org/W2087361130","https://openalex.org/W2089455813","https://openalex.org/W2140453381","https://openalex.org/W2151249511","https://openalex.org/W2152437528","https://openalex.org/W2160484851","https://openalex.org/W2164715417","https://openalex.org/W2341380858","https://openalex.org/W2427788461","https://openalex.org/W2604113568","https://openalex.org/W2612391007","https://openalex.org/W2621280964","https://openalex.org/W2740817677","https://openalex.org/W2767328299","https://openalex.org/W2792921236","https://openalex.org/W3102704970","https://openalex.org/W6640455647"],"related_works":["https://openalex.org/W2948148442","https://openalex.org/W2461250372","https://openalex.org/W2394342941","https://openalex.org/W2169853506","https://openalex.org/W2547124190","https://openalex.org/W2350586049","https://openalex.org/W2096000848","https://openalex.org/W1901494946","https://openalex.org/W2155161695","https://openalex.org/W2123328017"],"abstract_inverted_index":{"We":[0,135],"examine":[1],"approaches":[2],"used":[3,40,62],"for":[4,116],"block-based":[5,166],"inverted":[6],"index":[7,117],"compression,":[8],"such":[9],"as":[10],"the":[11,52,68,75,83,98,120,125,139],"OptPFOR":[12],"mechanism,":[13,127],"in":[14,31,63],"which":[15,32],"fixed-length":[16],"blocks":[17],"of":[18,24,49,54,70,85,100,149],"postings":[19],"data":[20],"are":[21],"compressed":[22],"independently":[23],"each":[25,43,64],"other.":[26],"Building":[27],"on":[28],"previous":[29],"work":[30],"asymmetric":[33],"numeral":[34],"systems":[35],"(ANS)":[36],"entropy":[37],"coding":[38],"is":[39],"to":[41,66,92,105,153,164],"represent":[42],"block,":[44],"we":[45],"explore":[46],"a":[47,86,101,131,145],"number":[48],"enhancements:":[50],"(i)":[51],"use":[53,84,99],"two-dimensional":[55],"conditioning":[56],"contexts,":[57],"with":[58],"two":[59],"aggregate":[60],"parameters":[61],"block":[65],"categorize":[67],"distribution":[69],"symbol":[71],"values":[72],"that":[73,155],"underlies":[74],"ANS":[76,93],"approach,":[77],"rather":[78],"than":[79],"just":[80],"one;":[81],"(ii)":[82],"byte-friendly":[87],"strategic":[88],"mapping":[89],"from":[90],"symbols":[91],"codeword":[94],"buckets;":[95],"and":[96,128,144,157],"(iii)":[97],"context":[102],"merging":[103],"process":[104],"combine":[106],"similar":[107],"probability":[108],"distributions.":[109],"Collectively,":[110],"these":[111],"improvements":[112],"yield":[113],"superior":[114],"compression":[115],"data,":[118],"outperforming":[119],"reference":[121],"point":[122],"set":[123],"by":[124],"Interp":[126],"hence":[129],"representing":[130],"significant":[132],"step":[133],"forward.":[134],"describe":[136],"experiments":[137],"using":[138],"426":[140],"GiB":[141],"gov2":[142],"collection":[143,148],"new":[146],"large":[147],"publicly-available":[150],"news":[151],"articles":[152],"demonstrate":[154],"claim,":[156],"provide":[158],"query":[159],"evaluation":[160],"throughput":[161],"rates":[162],"compared":[163],"other":[165],"mechanisms.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
