{"id":"https://openalex.org/W2158911502","doi":"https://doi.org/10.1145/2063576.2063626","title":"Efficiently encoding term co-occurrences in inverted indexes","display_name":"Efficiently encoding term co-occurrences in inverted indexes","publication_year":2011,"publication_date":"2011-10-24","ids":{"openalex":"https://openalex.org/W2158911502","doi":"https://doi.org/10.1145/2063576.2063626","mag":"2158911502"},"language":"en","primary_location":{"id":"doi:10.1145/2063576.2063626","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2063576.2063626","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 20th ACM international conference on Information and knowledge management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073768909","display_name":"Marcus Fontoura","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marcus Fontoura","raw_affiliation_strings":["Google Inc., Mountain View, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Inc., Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086993894","display_name":"Maxim Gurevich","orcid":"https://orcid.org/0000-0003-4693-0556"},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maxim Gurevich","raw_affiliation_strings":["Yahoo! Research, Santa Clara, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037908462","display_name":"Vanja Josifovski","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vanja Josifovski","raw_affiliation_strings":["Yahoo! Research, Santa Clara, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070795618","display_name":"Sergei Vassilvitskii","orcid":"https://orcid.org/0000-0003-0235-1624"},"institutions":[{"id":"https://openalex.org/I4210133173","display_name":"Research!America (United States)","ror":"https://ror.org/044pgyv50","country_code":"US","type":"company","lineage":["https://openalex.org/I4210133173"]},{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sergei Vassilvitskii","raw_affiliation_strings":["Yahoo! Research, New York, NY, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research, New York, NY, USA","institution_ids":["https://openalex.org/I4210133173","https://openalex.org/I4210134091"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.4967,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.90373844,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"307","last_page":"316"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bitmap","display_name":"Bitmap","score":0.8635662198066711},{"id":"https://openalex.org/keywords/inverted-index","display_name":"Inverted index","score":0.8541658520698547},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8376063108444214},{"id":"https://openalex.org/keywords/precomputation","display_name":"Precomputation","score":0.8276048302650452},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.6496126651763916},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.591818630695343},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.5571267604827881},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5144301056861877},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.5144217610359192},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4783850908279419},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4638296365737915},{"id":"https://openalex.org/keywords/materialized-view","display_name":"Materialized view","score":0.4225974977016449},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.39573174715042114},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3255329132080078},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.21475091576576233},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1536635160446167},{"id":"https://openalex.org/keywords/view","display_name":"View","score":0.11664947867393494},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07733914256095886}],"concepts":[{"id":"https://openalex.org/C3115412","wikidata":"https://www.wikidata.org/wiki/Q1194708","display_name":"Bitmap","level":2,"score":0.8635662198066711},{"id":"https://openalex.org/C130590232","wikidata":"https://www.wikidata.org/wiki/Q1671754","display_name":"Inverted index","level":3,"score":0.8541658520698547},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8376063108444214},{"id":"https://openalex.org/C159379195","wikidata":"https://www.wikidata.org/wiki/Q7239568","display_name":"Precomputation","level":3,"score":0.8276048302650452},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.6496126651763916},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.591818630695343},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.5571267604827881},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5144301056861877},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.5144217610359192},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4783850908279419},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4638296365737915},{"id":"https://openalex.org/C98199447","wikidata":"https://www.wikidata.org/wiki/Q2445044","display_name":"Materialized view","level":4,"score":0.4225974977016449},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.39573174715042114},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3255329132080078},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.21475091576576233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1536635160446167},{"id":"https://openalex.org/C54239708","wikidata":"https://www.wikidata.org/wiki/Q1329910","display_name":"View","level":3,"score":0.11664947867393494},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07733914256095886},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C148840519","wikidata":"https://www.wikidata.org/wiki/Q1049878","display_name":"Database design","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2063576.2063626","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2063576.2063626","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 20th ACM international conference on Information and knowledge management","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.308.2883","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.308.2883","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://static.googleusercontent.com/external_content/untrusted_dlcp/research.google.com/en/us/pubs/archive/37367.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W1531395322","https://openalex.org/W1537796421","https://openalex.org/W1556741196","https://openalex.org/W1561988317","https://openalex.org/W1562093331","https://openalex.org/W1565494300","https://openalex.org/W1566959760","https://openalex.org/W1660390307","https://openalex.org/W1977841655","https://openalex.org/W1981732427","https://openalex.org/W1982858363","https://openalex.org/W1991360400","https://openalex.org/W2032866865","https://openalex.org/W2059387258","https://openalex.org/W2065472179","https://openalex.org/W2066636486","https://openalex.org/W2072156548","https://openalex.org/W2116504754","https://openalex.org/W2123006679","https://openalex.org/W2125362195","https://openalex.org/W2138662031","https://openalex.org/W2140795521","https://openalex.org/W2146032463","https://openalex.org/W2151361488","https://openalex.org/W2152064096","https://openalex.org/W2154610494","https://openalex.org/W2157405322","https://openalex.org/W2889395214","https://openalex.org/W6633810142","https://openalex.org/W6637101025","https://openalex.org/W6754499842"],"related_works":["https://openalex.org/W4247523873","https://openalex.org/W2979286513","https://openalex.org/W2154688864","https://openalex.org/W2913201029","https://openalex.org/W2158911502","https://openalex.org/W2613215397","https://openalex.org/W1976852594","https://openalex.org/W1997546439","https://openalex.org/W3101598783","https://openalex.org/W1985995549"],"abstract_inverted_index":{"Precomputation":[0],"of":[1,24,49,89,103,116,143,147,168,181,197,225],"common":[2],"term":[3,80,99,107],"co-occurrences":[4,81,115],"has":[5],"been":[6],"successfully":[7],"applied":[8],"to":[9,45,112,137,163,229],"improve":[10],"query":[11,38,50,129,199,226],"performance":[12],"in":[13,34,82,91,125],"large":[14],"scale":[15],"search":[16],"engines":[17],"based":[18],"on":[19,207],"inverted":[20,83],"indexes.":[21,84],"The":[22],"results":[23,54],"such":[25],"precomputations":[26],"are":[27,43,190],"traditionally":[28],"stored":[29],"as":[30,52,192],"additional":[31,149],"posting":[32,111,184],"lists":[33,42,185],"the":[35,47,53,92,114,126,144,148,173,179,198,208,223],"index.":[36,127],"During":[37],"evaluation,":[39,130],"these":[40],"precomputed":[41,64,154,183],"used":[44,136,162],"reduce":[46],"number":[48],"terms,":[51,121],"for":[55,78,106],"multiple":[56],"terms":[57,90],"can":[58,134,159],"be":[59,135,161],"accessed":[60],"through":[61],"a":[62,86,153,215],"single":[63],"list.":[65],"In":[66,151],"this":[67,71],"paper,":[68],"we":[69,94,176],"expand":[70],"paradigm":[72],"by":[73],"considering":[74],"an":[75,204],"alternative":[76],"method":[77,231],"storing":[79],"For":[85],"selected":[87],"set":[88],"index,":[93],"store":[95,113],"bitmaps":[96,133,174],"that":[97,140,188,214],"encode":[98],"co-occurrences.":[100],"A":[101],"bitmap":[102],"size":[104,131],"k":[105,119,132],"t":[108,117],"augments":[109],"each":[110,230],"with":[118],"other":[120],"across":[122],"every":[123],"document":[124],"At":[128],"answer":[138],"queries":[139,165],"involve":[141],"any":[142],"2^k":[145],"combinations":[146],"terms.":[150,170],"contrast,":[152],"list,":[155],"although":[156],"typically":[157],"shorter,":[158],"only":[160],"evaluate":[164,172],"containing":[166],"all":[167],"its":[169],"We":[171,202],"technique":[175],"propose,":[177],"and":[178,186,212],"baseline":[180],"adding":[182],"show":[187,213],"they":[189,193],"complementary,":[191],"capture":[194],"different":[195],"aspects":[196],"evaluation":[200,206,227],"cost.":[201],"perform":[203],"experimental":[205],"TREC":[209],"WT10g":[210],"corpus":[211],"hybrid":[216],"strategy":[217],"combining":[218],"both":[219],"methods":[220],"significantly":[221],"lowers":[222],"cost":[224],"compared":[228],"separately.":[232]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
