{"id":"https://openalex.org/W2913468067","doi":"https://doi.org/10.1109/bigdata.2018.8622177","title":"Exploring Size-Speed Trade-Offs in Static Index Pruning","display_name":"Exploring Size-Speed Trade-Offs in Static Index Pruning","publication_year":2018,"publication_date":"2018-12-01","ids":{"openalex":"https://openalex.org/W2913468067","doi":"https://doi.org/10.1109/bigdata.2018.8622177","mag":"2913468067"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2018.8622177","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2018.8622177","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101735250","display_name":"Juan Rodriguez","orcid":"https://orcid.org/0000-0001-6483-6956"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Juan Rodriguez","raw_affiliation_strings":["Computer Science and Engineering, New York University, Brooklyn, New York, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, New York University, Brooklyn, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074323303","display_name":"Torsten Suel","orcid":"https://orcid.org/0000-0002-8324-980X"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Torsten Suel","raw_affiliation_strings":["Computer Science and Engineering, New York University, Brooklyn, New York, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, New York University, Brooklyn, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101735250"],"corresponding_institution_ids":["https://openalex.org/I57206974"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.18418087,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"30","issue":null,"first_page":"1093","last_page":"1100"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.8930284380912781},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.817298173904419},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.7528945207595825},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.7000119686126709},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.6576481461524963},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.47782424092292786},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4655958116054535},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.42235201597213745},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.42147111892700195},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.41304588317871094},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32172155380249023},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.09223267436027527},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.06571939587593079}],"concepts":[{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.8930284380912781},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.817298173904419},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.7528945207595825},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.7000119686126709},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.6576481461524963},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.47782424092292786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4655958116054535},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.42235201597213745},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42147111892700195},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41304588317871094},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32172155380249023},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.09223267436027527},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.06571939587593079},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2018.8622177","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2018.8622177","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1535624880","https://openalex.org/W1567493457","https://openalex.org/W1969378784","https://openalex.org/W1969840591","https://openalex.org/W1989433773","https://openalex.org/W2002788131","https://openalex.org/W2006997130","https://openalex.org/W2009346361","https://openalex.org/W2022191808","https://openalex.org/W2023268471","https://openalex.org/W2037946039","https://openalex.org/W2062296170","https://openalex.org/W2076685614","https://openalex.org/W2078251464","https://openalex.org/W2116566885","https://openalex.org/W2124921735","https://openalex.org/W2126550498","https://openalex.org/W2127899914","https://openalex.org/W2135290016","https://openalex.org/W2137250554","https://openalex.org/W2584320920","https://openalex.org/W2768348081","https://openalex.org/W2915092747","https://openalex.org/W6669781704","https://openalex.org/W6678084625","https://openalex.org/W6745609711"],"related_works":["https://openalex.org/W2058965144","https://openalex.org/W2164382479","https://openalex.org/W2146343568","https://openalex.org/W98480971","https://openalex.org/W2150291671","https://openalex.org/W2013643406","https://openalex.org/W2027972911","https://openalex.org/W2157978810","https://openalex.org/W2597809628","https://openalex.org/W3046370962"],"abstract_inverted_index":{"Static":[0],"index":[1,8,14,125,133,167,175],"pruning":[2,34,176],"techniques":[3,35],"remove":[4],"postings":[5,41,52,142],"from":[6,101],"inverted":[7],"structures":[9],"in":[10,25,131],"order":[11],"to":[12,49,65,78],"decrease":[13],"size":[15,126,168],"and":[16,61,127,151,158,169],"query":[17,128,170],"processing":[18,129,171],"cost,":[19],"while":[20],"minimizing":[21],"the":[22,80,90,122],"resulting":[23],"loss":[24],"result":[26],"quality.":[27],"A":[28],"number":[29],"of":[30,40,46,68,82,105,147],"authors":[31],"have":[32],"proposed":[33],"that":[36,76,99,110,137,140,159,177],"use":[37],"basic":[38],"properties":[39],"as":[42,44],"well":[43],"results":[45],"past":[47],"queries":[48],"decide":[50],"what":[51],"should":[53],"be":[54],"kept.":[55],"However,":[56],"many":[57],"open":[58],"questions":[59],"remain,":[60],"our":[62],"goal":[63],"is":[64,121,161],"address":[66],"some":[67],"them":[69],"using":[70,143],"a":[71,83,102,116,144,162],"machine":[72],"learning":[73],"based":[74],"approach":[75,98,139],"tries":[77],"predict":[79],"usefulness":[81],"posting.":[84],"In":[85],"this":[86],"paper,":[87],"we":[88],"explore":[89],"following":[91],"questions:":[92],"(1)":[93],"How":[94],"much":[95],"does":[96],"an":[97,138],"learns":[100],"rich":[103,145],"set":[104,146],"features":[106,148],"outperform":[107,155],"previous":[108,156],"work":[109],"uses":[111],"heuristic":[112],"approaches":[113],"or":[114],"just":[115],"few":[117],"features?":[118],"(2)":[119],"What":[120],"relationship":[123],"between":[124,166],"speed":[130,172],"static":[132,174],"pruning?":[134],"We":[135],"show":[136],"prunes":[141],"including":[149],"post-hits":[150],"doc-hits":[152],"can":[153],"significantly":[154],"approaches,":[157],"there":[160],"very":[163],"pronounced":[164],"trade-off":[165],"for":[173],"has":[178],"not":[179],"been":[180],"previously":[181],"explored.":[182]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
