{"id":"https://openalex.org/W2073188425","doi":"https://doi.org/10.1145/1458082.1458174","title":"Can phrase indexing help to process non-phrase queries?","display_name":"Can phrase indexing help to process non-phrase queries?","publication_year":2008,"publication_date":"2008-10-26","ids":{"openalex":"https://openalex.org/W2073188425","doi":"https://doi.org/10.1145/1458082.1458174","mag":"2073188425"},"language":"en","primary_location":{"id":"doi:10.1145/1458082.1458174","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458082.1458174","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th ACM conference on Information and knowledge management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113750084","display_name":"Mingjie Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mingjie Zhu","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China",", University of Science and Technology of China, Hefei, China#TAB#"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":", University of Science and Technology of China, Hefei, China#TAB#","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087920747","display_name":"Shuming Shi","orcid":"https://orcid.org/0000-0001-7018-0682"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuming Shi","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China","Microsoft research Asia, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064573190","display_name":"Nenghai Yu","orcid":"https://orcid.org/0000-0003-4417-9316"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nenghai Yu","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China",", University of Science and Technology of China, Hefei, China#TAB#"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":", University of Science and Technology of China, Hefei, China#TAB#","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025631695","display_name":"Ji-Rong Wen","orcid":"https://orcid.org/0000-0002-9777-9676"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ji-Rong Wen","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China","Microsoft research Asia, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5113750084"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":2.986,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.91147912,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"679","last_page":"688"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8375372886657715},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.809594452381134},{"id":"https://openalex.org/keywords/phrase-search","display_name":"Phrase search","score":0.7809455394744873},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.7728569507598877},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.7175672650337219},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5785446763038635},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5464732050895691},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.46919959783554077},{"id":"https://openalex.org/keywords/factor","display_name":"Factor (programming language)","score":0.4514526128768921},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4506695866584778},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4246484637260437},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.37872248888015747},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.3673008680343628},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.3125806152820587},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2991614043712616},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.22819867730140686},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.12053048610687256},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.06321516633033752}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8375372886657715},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.809594452381134},{"id":"https://openalex.org/C37202355","wikidata":"https://www.wikidata.org/wiki/Q7188071","display_name":"Phrase search","level":5,"score":0.7809455394744873},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.7728569507598877},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.7175672650337219},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5785446763038635},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5464732050895691},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.46919959783554077},{"id":"https://openalex.org/C2781039887","wikidata":"https://www.wikidata.org/wiki/Q1391724","display_name":"Factor (programming language)","level":2,"score":0.4514526128768921},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4506695866584778},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4246484637260437},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37872248888015747},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.3673008680343628},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.3125806152820587},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2991614043712616},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.22819867730140686},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.12053048610687256},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.06321516633033752},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1458082.1458174","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458082.1458174","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th ACM conference on Information and knowledge management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W95284390","https://openalex.org/W1535279741","https://openalex.org/W1760082936","https://openalex.org/W1973520416","https://openalex.org/W1977841655","https://openalex.org/W1981732427","https://openalex.org/W1985986751","https://openalex.org/W1991360400","https://openalex.org/W2006608770","https://openalex.org/W2009346361","https://openalex.org/W2019168472","https://openalex.org/W2020919487","https://openalex.org/W2065721358","https://openalex.org/W2066636486","https://openalex.org/W2116504754","https://openalex.org/W2127899914","https://openalex.org/W2134206624","https://openalex.org/W2135050452","https://openalex.org/W2138662031","https://openalex.org/W2139611552","https://openalex.org/W2160484851","https://openalex.org/W2621280964"],"related_works":["https://openalex.org/W4282568653","https://openalex.org/W2919747665","https://openalex.org/W2119380317","https://openalex.org/W2070155952","https://openalex.org/W2082868123","https://openalex.org/W1981732427","https://openalex.org/W2533706070","https://openalex.org/W2129100979","https://openalex.org/W2066869521","https://openalex.org/W2105258824"],"abstract_inverted_index":{"Modern":[0],"web":[1,8],"search":[2,48,100,144],"engines,":[3],"while":[4],"indexing":[5],"billions":[6],"of":[7,36,46,56,73,120,125,136,164,179],"pages,":[9],"are":[10,139],"expected":[11],"to":[12,90,96,151,161,175,201],"process":[13,101,152],"queries":[14,154],"and":[15],"return":[16],"results":[17,183],"in":[18,42,62,69,85,155],"a":[19,63,92,133],"very":[20],"short":[21],"time.":[22],"Many":[23],"approaches":[24],"have":[25],"been":[26,149],"proposed":[27],"for":[28,142,203],"efficiently":[29],"computing":[30],"top-k":[31,76,190],"query":[32,60,198],"results,":[33],"but":[34],"most":[35,72],"them":[37],"ignore":[38],"one":[39],"key":[40],"factor":[41],"the":[43,54,57,74,99,104,116,126,162,167,177,188],"ranking":[44,70],"functions":[45],"commercial":[47],"engines":[49],"-":[50],"term-proximity,":[51],"which":[52,138],"is":[53,67,129,173],"metric":[55],"distance":[58],"between":[59],"terms":[61],"document.":[64],"When":[65],"term-proximity":[66,105],"included":[68],"functions,":[71],"existing":[75,156],"algorithms":[77],"will":[78],"become":[79],"inefficient.":[80],"To":[81],"address":[82],"this":[83,86],"problem,":[84],"paper":[87],"we":[88],"propose":[89],"build":[91],"compact":[93,108],"phrase":[94,109,127,153,171],"index":[95,110,128,147,172],"speed":[97],"up":[98],"when":[102],"incorporating":[103],"factor.":[106],"The":[107,123],"can":[111,195],"help":[112],"more":[113],"accurately":[114],"estimate":[115],"score":[117],"upper":[118],"bounds":[119],"unknown":[121],"documents.":[122],"size":[124],"controlled":[130],"by":[131],"including":[132],"small":[134],"portion":[135],"phrases":[137],"possibly":[140],"helpful":[141],"improving":[143],"performance.":[145],"Phrase":[146],"has":[148],"used":[150,174],"work.":[157],"It":[158],"is,":[159],"however,":[160],"best":[163],"our":[165,193],"knowledge,":[166],"first":[168],"time":[169,200],"that":[170],"improve":[176],"performance":[178],"generic":[180],"queries.":[181],"Experimental":[182],"show":[184],"that,":[185],"compared":[186],"with":[187],"state-of-the-art":[189],"computation":[191],"approaches,":[192],"approach":[194],"reduce":[196],"average":[197],"processing":[199],"1/5":[202],"typical":[204],"setttings.":[205]},"counts_by_year":[{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":5},{"year":2012,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
